{ "nbformat": 4, "nbformat_minor": 0, "metadata": { "colab": { "provenance": [], "machine_shape": "hm", "gpuType": "T4" }, "kernelspec": { "name": "python3", "display_name": "Python 3" }, "language_info": { "name": "python" }, "accelerator": "GPU", "widgets": { "application/vnd.jupyter.widget-state+json": { "e5e2a14ad13b4dfb8ecf38397a645c31": { "model_module": "@jupyter-widgets/controls", "model_name": "HBoxModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": [ "IPY_MODEL_448fd18a7e0942e2af6a4062fcee5ec0", "IPY_MODEL_0f8e568fa21d4d74908b1e3676db60c1", "IPY_MODEL_ba0a4c5990d44a189ca0215690d264da" ], "layout": "IPY_MODEL_d1288e87cb3d44419b0952d2b3eee9f7" } }, "448fd18a7e0942e2af6a4062fcee5ec0": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_7fa34b2bb77d4fd78980c00857d740f5", "placeholder": "​", "style": "IPY_MODEL_8d59d79aa8f94360ba0037a24a89735a", "value": "100%" } }, "0f8e568fa21d4d74908b1e3676db60c1": { "model_module": "@jupyter-widgets/controls", "model_name": "FloatProgressModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": 
"success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_c9e399f106b54f82aff75da26119a20a", "max": 2, "min": 0, "orientation": "horizontal", "style": "IPY_MODEL_782ed4211774400a85e5742fcb7e4ec9", "value": 2 } }, "ba0a4c5990d44a189ca0215690d264da": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_9918f25201f145c1a5933d2ff27f8023", "placeholder": "​", "style": "IPY_MODEL_e785d4da0eca49a2a96aee6b8ec25080", "value": " 2/2 [00:00<00:00, 83.56it/s]" } }, "d1288e87cb3d44419b0952d2b3eee9f7": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": 
null } }, "7fa34b2bb77d4fd78980c00857d740f5": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "8d59d79aa8f94360ba0037a24a89735a": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "c9e399f106b54f82aff75da26119a20a": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, 
"align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "782ed4211774400a85e5742fcb7e4ec9": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": "" } }, "9918f25201f145c1a5933d2ff27f8023": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, 
"justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "e785d4da0eca49a2a96aee6b8ec25080": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "2979cc614ea7448b8575d09fab4959d0": { "model_module": "@jupyter-widgets/controls", "model_name": "HBoxModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": [ "IPY_MODEL_78d5deb4cbf74aabaae89a42ceee72eb", "IPY_MODEL_da7f9d8912fd403e85379419cd518023", "IPY_MODEL_1564a0d3efc0455bae2c3d90325a4571" ], "layout": "IPY_MODEL_734777f838be43f0b3e9c954e393d691" } }, "78d5deb4cbf74aabaae89a42ceee72eb": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_df64aa40c8e0419f87075288d9383483", "placeholder": "​", "style": "IPY_MODEL_ca7be44dc07d41829a2d3525ad0cb63c", 
"value": "Map: 100%" } }, "da7f9d8912fd403e85379419cd518023": { "model_module": "@jupyter-widgets/controls", "model_name": "FloatProgressModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_003d9c73437542dd9c4c59a3730ef696", "max": 9094, "min": 0, "orientation": "horizontal", "style": "IPY_MODEL_bfb2829000de43028c4922ecf2344134", "value": 9094 } }, "1564a0d3efc0455bae2c3d90325a4571": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_ce74e7478bef4ca987232389d94a89ee", "placeholder": "​", "style": "IPY_MODEL_1e8b918d21ea44268fb1112f8fd1007f", "value": " 9094/9094 [00:24<00:00, 363.60 examples/s]" } }, "734777f838be43f0b3e9c954e393d691": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, 
"grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": "hidden", "width": null } }, "df64aa40c8e0419f87075288d9383483": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "ca7be44dc07d41829a2d3525ad0cb63c": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", 
"_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "003d9c73437542dd9c4c59a3730ef696": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "bfb2829000de43028c4922ecf2344134": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": "" } }, "ce74e7478bef4ca987232389d94a89ee": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", 
"_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "1e8b918d21ea44268fb1112f8fd1007f": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } } } } }, "cells": [ { "cell_type": "code", "source": [ "!pip install datasets\n", "!pip install transformers" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "3pCTD5isFrhN", "outputId": "23d51816-5b1e-415d-8c2f-32c9e2033684" }, "execution_count": 1, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "Requirement already satisfied: datasets in /usr/local/lib/python3.10/dist-packages (2.13.1)\n", "Requirement already satisfied: numpy>=1.17 in /usr/local/lib/python3.10/dist-packages (from datasets) (1.22.4)\n", "Requirement already satisfied: pyarrow>=8.0.0 in /usr/local/lib/python3.10/dist-packages (from datasets) (9.0.0)\n", "Requirement already satisfied: dill<0.3.7,>=0.3.0 in 
/usr/local/lib/python3.10/dist-packages (from datasets) (0.3.6)\n", "Requirement already satisfied: pandas in /usr/local/lib/python3.10/dist-packages (from datasets) (1.5.3)\n", "Requirement already satisfied: requests>=2.19.0 in /usr/local/lib/python3.10/dist-packages (from datasets) (2.27.1)\n", "Requirement already satisfied: tqdm>=4.62.1 in /usr/local/lib/python3.10/dist-packages (from datasets) (4.65.0)\n", "Requirement already satisfied: xxhash in /usr/local/lib/python3.10/dist-packages (from datasets) (3.2.0)\n", "Requirement already satisfied: multiprocess in /usr/local/lib/python3.10/dist-packages (from datasets) (0.70.14)\n", "Requirement already satisfied: fsspec[http]>=2021.11.1 in /usr/local/lib/python3.10/dist-packages (from datasets) (2023.6.0)\n", "Requirement already satisfied: aiohttp in /usr/local/lib/python3.10/dist-packages (from datasets) (3.8.4)\n", "Requirement already satisfied: huggingface-hub<1.0.0,>=0.11.0 in /usr/local/lib/python3.10/dist-packages (from datasets) (0.16.4)\n", "Requirement already satisfied: packaging in /usr/local/lib/python3.10/dist-packages (from datasets) (23.1)\n", "Requirement already satisfied: pyyaml>=5.1 in /usr/local/lib/python3.10/dist-packages (from datasets) (6.0.1)\n", "Requirement already satisfied: attrs>=17.3.0 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (23.1.0)\n", "Requirement already satisfied: charset-normalizer<4.0,>=2.0 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (2.0.12)\n", "Requirement already satisfied: multidict<7.0,>=4.5 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (6.0.4)\n", "Requirement already satisfied: async-timeout<5.0,>=4.0.0a3 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (4.0.2)\n", "Requirement already satisfied: yarl<2.0,>=1.0 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (1.9.2)\n", "Requirement already satisfied: frozenlist>=1.1.1 in 
/usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (1.4.0)\n", "Requirement already satisfied: aiosignal>=1.1.2 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (1.3.1)\n", "Requirement already satisfied: filelock in /usr/local/lib/python3.10/dist-packages (from huggingface-hub<1.0.0,>=0.11.0->datasets) (3.12.2)\n", "Requirement already satisfied: typing-extensions>=3.7.4.3 in /usr/local/lib/python3.10/dist-packages (from huggingface-hub<1.0.0,>=0.11.0->datasets) (4.7.1)\n", "Requirement already satisfied: urllib3<1.27,>=1.21.1 in /usr/local/lib/python3.10/dist-packages (from requests>=2.19.0->datasets) (1.26.16)\n", "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.10/dist-packages (from requests>=2.19.0->datasets) (2023.5.7)\n", "Requirement already satisfied: idna<4,>=2.5 in /usr/local/lib/python3.10/dist-packages (from requests>=2.19.0->datasets) (3.4)\n", "Requirement already satisfied: python-dateutil>=2.8.1 in /usr/local/lib/python3.10/dist-packages (from pandas->datasets) (2.8.2)\n", "Requirement already satisfied: pytz>=2020.1 in /usr/local/lib/python3.10/dist-packages (from pandas->datasets) (2022.7.1)\n", "Requirement already satisfied: six>=1.5 in /usr/local/lib/python3.10/dist-packages (from python-dateutil>=2.8.1->pandas->datasets) (1.16.0)\n", "Requirement already satisfied: transformers in /usr/local/lib/python3.10/dist-packages (4.31.0)\n", "Requirement already satisfied: filelock in /usr/local/lib/python3.10/dist-packages (from transformers) (3.12.2)\n", "Requirement already satisfied: huggingface-hub<1.0,>=0.14.1 in /usr/local/lib/python3.10/dist-packages (from transformers) (0.16.4)\n", "Requirement already satisfied: numpy>=1.17 in /usr/local/lib/python3.10/dist-packages (from transformers) (1.22.4)\n", "Requirement already satisfied: packaging>=20.0 in /usr/local/lib/python3.10/dist-packages (from transformers) (23.1)\n", "Requirement already satisfied: pyyaml>=5.1 in 
/usr/local/lib/python3.10/dist-packages (from transformers) (6.0.1)\n", "Requirement already satisfied: regex!=2019.12.17 in /usr/local/lib/python3.10/dist-packages (from transformers) (2022.10.31)\n", "Requirement already satisfied: requests in /usr/local/lib/python3.10/dist-packages (from transformers) (2.27.1)\n", "Requirement already satisfied: tokenizers!=0.11.3,<0.14,>=0.11.1 in /usr/local/lib/python3.10/dist-packages (from transformers) (0.13.3)\n", "Requirement already satisfied: safetensors>=0.3.1 in /usr/local/lib/python3.10/dist-packages (from transformers) (0.3.1)\n", "Requirement already satisfied: tqdm>=4.27 in /usr/local/lib/python3.10/dist-packages (from transformers) (4.65.0)\n", "Requirement already satisfied: fsspec in /usr/local/lib/python3.10/dist-packages (from huggingface-hub<1.0,>=0.14.1->transformers) (2023.6.0)\n", "Requirement already satisfied: typing-extensions>=3.7.4.3 in /usr/local/lib/python3.10/dist-packages (from huggingface-hub<1.0,>=0.14.1->transformers) (4.7.1)\n", "Requirement already satisfied: urllib3<1.27,>=1.21.1 in /usr/local/lib/python3.10/dist-packages (from requests->transformers) (1.26.16)\n", "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.10/dist-packages (from requests->transformers) (2023.5.7)\n", "Requirement already satisfied: charset-normalizer~=2.0.0 in /usr/local/lib/python3.10/dist-packages (from requests->transformers) (2.0.12)\n", "Requirement already satisfied: idna<4,>=2.5 in /usr/local/lib/python3.10/dist-packages (from requests->transformers) (3.4)\n" ] } ] }, { "cell_type": "code", "source": [ "pip install transformers[torch]" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "GTagr5gdU_Xh", "outputId": "a24eca2e-877a-44ef-a1c5-48db45565372" }, "execution_count": 2, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "Requirement already satisfied: transformers[torch] in /usr/local/lib/python3.10/dist-packages (4.31.0)\n", 
"Requirement already satisfied: filelock in /usr/local/lib/python3.10/dist-packages (from transformers[torch]) (3.12.2)\n", "Requirement already satisfied: huggingface-hub<1.0,>=0.14.1 in /usr/local/lib/python3.10/dist-packages (from transformers[torch]) (0.16.4)\n", "Requirement already satisfied: numpy>=1.17 in /usr/local/lib/python3.10/dist-packages (from transformers[torch]) (1.22.4)\n", "Requirement already satisfied: packaging>=20.0 in /usr/local/lib/python3.10/dist-packages (from transformers[torch]) (23.1)\n", "Requirement already satisfied: pyyaml>=5.1 in /usr/local/lib/python3.10/dist-packages (from transformers[torch]) (6.0.1)\n", "Requirement already satisfied: regex!=2019.12.17 in /usr/local/lib/python3.10/dist-packages (from transformers[torch]) (2022.10.31)\n", "Requirement already satisfied: requests in /usr/local/lib/python3.10/dist-packages (from transformers[torch]) (2.27.1)\n", "Requirement already satisfied: tokenizers!=0.11.3,<0.14,>=0.11.1 in /usr/local/lib/python3.10/dist-packages (from transformers[torch]) (0.13.3)\n", "Requirement already satisfied: safetensors>=0.3.1 in /usr/local/lib/python3.10/dist-packages (from transformers[torch]) (0.3.1)\n", "Requirement already satisfied: tqdm>=4.27 in /usr/local/lib/python3.10/dist-packages (from transformers[torch]) (4.65.0)\n", "Requirement already satisfied: torch!=1.12.0,>=1.9 in /usr/local/lib/python3.10/dist-packages (from transformers[torch]) (2.0.1+cu118)\n", "Requirement already satisfied: accelerate>=0.20.3 in /usr/local/lib/python3.10/dist-packages (from transformers[torch]) (0.21.0)\n", "Requirement already satisfied: psutil in /usr/local/lib/python3.10/dist-packages (from accelerate>=0.20.3->transformers[torch]) (5.9.5)\n", "Requirement already satisfied: fsspec in /usr/local/lib/python3.10/dist-packages (from huggingface-hub<1.0,>=0.14.1->transformers[torch]) (2023.6.0)\n", "Requirement already satisfied: typing-extensions>=3.7.4.3 in /usr/local/lib/python3.10/dist-packages (from 
huggingface-hub<1.0,>=0.14.1->transformers[torch]) (4.7.1)\n", "Requirement already satisfied: sympy in /usr/local/lib/python3.10/dist-packages (from torch!=1.12.0,>=1.9->transformers[torch]) (1.11.1)\n", "Requirement already satisfied: networkx in /usr/local/lib/python3.10/dist-packages (from torch!=1.12.0,>=1.9->transformers[torch]) (3.1)\n", "Requirement already satisfied: jinja2 in /usr/local/lib/python3.10/dist-packages (from torch!=1.12.0,>=1.9->transformers[torch]) (3.1.2)\n", "Requirement already satisfied: triton==2.0.0 in /usr/local/lib/python3.10/dist-packages (from torch!=1.12.0,>=1.9->transformers[torch]) (2.0.0)\n", "Requirement already satisfied: cmake in /usr/local/lib/python3.10/dist-packages (from triton==2.0.0->torch!=1.12.0,>=1.9->transformers[torch]) (3.25.2)\n", "Requirement already satisfied: lit in /usr/local/lib/python3.10/dist-packages (from triton==2.0.0->torch!=1.12.0,>=1.9->transformers[torch]) (16.0.6)\n", "Requirement already satisfied: urllib3<1.27,>=1.21.1 in /usr/local/lib/python3.10/dist-packages (from requests->transformers[torch]) (1.26.16)\n", "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.10/dist-packages (from requests->transformers[torch]) (2023.5.7)\n", "Requirement already satisfied: charset-normalizer~=2.0.0 in /usr/local/lib/python3.10/dist-packages (from requests->transformers[torch]) (2.0.12)\n", "Requirement already satisfied: idna<4,>=2.5 in /usr/local/lib/python3.10/dist-packages (from requests->transformers[torch]) (3.4)\n", "Requirement already satisfied: MarkupSafe>=2.0 in /usr/local/lib/python3.10/dist-packages (from jinja2->torch!=1.12.0,>=1.9->transformers[torch]) (2.1.3)\n", "Requirement already satisfied: mpmath>=0.19 in /usr/local/lib/python3.10/dist-packages (from sympy->torch!=1.12.0,>=1.9->transformers[torch]) (1.3.0)\n" ] } ] }, { "cell_type": "code", "source": [ "pip install accelerate" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": 
"W79jQrLDVa5y", "outputId": "c24ba2aa-af11-4f81-e4ac-e2b603b14549" }, "execution_count": 3, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "Requirement already satisfied: accelerate in /usr/local/lib/python3.10/dist-packages (0.21.0)\n", "Requirement already satisfied: numpy>=1.17 in /usr/local/lib/python3.10/dist-packages (from accelerate) (1.22.4)\n", "Requirement already satisfied: packaging>=20.0 in /usr/local/lib/python3.10/dist-packages (from accelerate) (23.1)\n", "Requirement already satisfied: psutil in /usr/local/lib/python3.10/dist-packages (from accelerate) (5.9.5)\n", "Requirement already satisfied: pyyaml in /usr/local/lib/python3.10/dist-packages (from accelerate) (6.0.1)\n", "Requirement already satisfied: torch>=1.10.0 in /usr/local/lib/python3.10/dist-packages (from accelerate) (2.0.1+cu118)\n", "Requirement already satisfied: filelock in /usr/local/lib/python3.10/dist-packages (from torch>=1.10.0->accelerate) (3.12.2)\n", "Requirement already satisfied: typing-extensions in /usr/local/lib/python3.10/dist-packages (from torch>=1.10.0->accelerate) (4.7.1)\n", "Requirement already satisfied: sympy in /usr/local/lib/python3.10/dist-packages (from torch>=1.10.0->accelerate) (1.11.1)\n", "Requirement already satisfied: networkx in /usr/local/lib/python3.10/dist-packages (from torch>=1.10.0->accelerate) (3.1)\n", "Requirement already satisfied: jinja2 in /usr/local/lib/python3.10/dist-packages (from torch>=1.10.0->accelerate) (3.1.2)\n", "Requirement already satisfied: triton==2.0.0 in /usr/local/lib/python3.10/dist-packages (from torch>=1.10.0->accelerate) (2.0.0)\n", "Requirement already satisfied: cmake in /usr/local/lib/python3.10/dist-packages (from triton==2.0.0->torch>=1.10.0->accelerate) (3.25.2)\n", "Requirement already satisfied: lit in /usr/local/lib/python3.10/dist-packages (from triton==2.0.0->torch>=1.10.0->accelerate) (16.0.6)\n", "Requirement already satisfied: MarkupSafe>=2.0 in 
/usr/local/lib/python3.10/dist-packages (from jinja2->torch>=1.10.0->accelerate) (2.1.3)\n", "Requirement already satisfied: mpmath>=0.19 in /usr/local/lib/python3.10/dist-packages (from sympy->torch>=1.10.0->accelerate) (1.3.0)\n" ] } ] }, { "cell_type": "markdown", "source": [ "## Steps\n", "\n", "1. Prepare dataset\n", "2. Load pretrained tokenizer, call it with dataset -> encodings\n", "3. Build PyTorch Dataset with encodings\n", "4. Load pretrained model\n", "5. a. Load Trainer and train it\n", " b. or use naive PyTorch training pipeline" ], "metadata": { "id": "rzk_Q6ACfTIl" } }, { "cell_type": "markdown", "source": [ "## Pretrained model for patentability from Hugging Face" ], "metadata": { "id": "EALuEZYSJozD" } }, { "cell_type": "code", "source": [ "model_name = 'distilbert-base-uncased' #'AI-Growth-Lab/PatentSBERTa'" ], "metadata": { "id": "Ds0R-Aacnxj1" }, "execution_count": 4, "outputs": [] }, { "cell_type": "markdown", "source": [ "## Import libraries and pretrained model" ], "metadata": { "id": "cPjlmk7aFwkR" } }, { "cell_type": "code", "source": [ "# Pretty print\n", "from pprint import pprint\n", "# Datasets load_dataset function\n", "from datasets import load_dataset\n", "# Transformers AutoTokenizer\n", "from transformers import AutoTokenizer, AutoModelForSequenceClassification, DistilBertForSequenceClassification\n", "tokenizer = AutoTokenizer.from_pretrained(model_name)\n", "# Standard PyTorch DataLoader\n", "from torch.utils.data import DataLoader\n", "\n", "from transformers import pipeline, Trainer, TrainingArguments\n", "\n", "\n", "import torch\n", "import torch.nn.functional as F\n", "\n", "from transformers import logging\n", "\n", "logging.set_verbosity_warning()" ], "metadata": { "id": "FxZeFFTlFvz1" }, "execution_count": 5, "outputs": [] }, { "cell_type": "markdown", "source": [ "## Download Dataset (USPTO)" ], "metadata": { "id": "jDVxfOsznnQP" } }, { "cell_type": "markdown", "source": [ "Use the `load_dataset` function to load all the 
patent applications that were filed to the USPTO in January 2016. We specify the date ranges of the training and validation sets as January 1-21, 2016 and January 22-31, 2016, respectively." ], "metadata": { "id": "JtxpuQV7F712" } }, { "cell_type": "code", "source": [ "dataset_dict = load_dataset('HUPD/hupd',\n", " name='sample',\n", " data_files=\"https://huggingface.co/datasets/HUPD/hupd/blob/main/hupd_metadata_2022-02-22.feather\",\n", " icpr_label=None,\n", " train_filing_start_date='2016-01-01',\n", " train_filing_end_date='2016-01-21',\n", " val_filing_start_date='2016-01-22',\n", " val_filing_end_date='2016-01-31',\n", ")\n", "\n", "print('Loading is done!')" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 104, "referenced_widgets": [ "e5e2a14ad13b4dfb8ecf38397a645c31", "448fd18a7e0942e2af6a4062fcee5ec0", "0f8e568fa21d4d74908b1e3676db60c1", "ba0a4c5990d44a189ca0215690d264da", "d1288e87cb3d44419b0952d2b3eee9f7", "7fa34b2bb77d4fd78980c00857d740f5", "8d59d79aa8f94360ba0037a24a89735a", "c9e399f106b54f82aff75da26119a20a", "782ed4211774400a85e5742fcb7e4ec9", "9918f25201f145c1a5933d2ff27f8023", "e785d4da0eca49a2a96aee6b8ec25080" ] }, "id": "pIDmYbLGF1a7", "outputId": "8e8b6ba8-e4db-4ff3-9275-f20cd9bada92" }, "execution_count": 6, "outputs": [ { "output_type": "stream", "name": "stderr", "text": [ "WARNING:datasets.builder:Found cached dataset hupd (/root/.cache/huggingface/datasets/HUPD___hupd/sample-bf35d7d92b870122/0.0.0/6920d2def8fd7767046c0470603357f76866e5a09c97e19571896bfdca521142)\n" ] }, { "output_type": "display_data", "data": { "text/plain": [ " 0%| | 0/2 [00:00 BACKGROUND OF THE INVENTION A network interface device permits a subscriber to access a network. A passive optical network (PON) is an example of a network capable of delivering voice, video and other data among multiple network subscribers, using a common optical fiber link. 
Passive optical splitters and combiners enable multiple optical network terminals (ONTs) to share the optical fiber link. In a PON, each ONT terminates the optical fiber link for a residential or business subscriber, and is sometimes referred to as a subscriber premises node that delivers Fiber to the Premises (FTTP) services. An ONT is connected to one or more subscriber devices, such as televisions, set-top boxes, telephones, computers, or network appliances, which ultimately receive the voice, video and data delivered vii the PON. An ONT is an example of a network interface, device. Other examples of a network interface device, in different network types, include cable modems and digital subscriber line (DSL) boxes. Generally, a network also includes a network access interface. In a PON, the network access interface is sometimes referred to as an optical line terminator (OLT), having multiple, independent PON interface modules that serve multiple optical fiber links. A PON interface module provides an interface for transmission and reception of data packets over a particular optical fiber link that serves a group of ONTs. A PON is a downstream-multicast medium. Each packet transmitted on an optical fiber link can be received by every ONT served by that link. ONTs identify selected packets or frames on the fiber link based on addressing information included within the packets or frames. Network equipment, such as network interface devices, in a cable or hybrid network may be connected to power provided by a central office (CO), which commonly utilizes battery and generator back-up power to maintain a continuous power supply. In contrast, an ONT in an all-fiber optic network is ordinarily powered locally at the subscriber premises. For this reason, an ONT often includes a battery to provide backup power during a power outage to maintain critical services, such as voice service. 
Conventionally, the fibre of a PON typically terminates at a street cabinet to be shared by a number of subscriber equipment. The street cabinet houses an optical network terminal (ONT). The last few meters or kilometer from the street cabinet to a subscriber's home is typically bridged using existing twisted pair copper cables or radio links. The bandwidth resources of the fibre to the street cabinet are typically shared amongst a group of subscribers using an Ethernet switch. For example the fibre may extend to a street cabinet, a kerb outside a subscribers home, or directly into the subscribers home itself. Due to the bulkiness, size and complexity of the ONT cabinets are all factors that increase design difficulty and accrue additional costs. Also, the ONT itself is valuable, and its mounting on a wall, especially outside, makes it susceptible to theft or to being accidentally knocked down. Therefore, it would be desirable to have a compact optical network terminal to make passive optical networks seamlessly connected to regular computers and any other systems to overcome the above restrictions.\"],\n", " 'summary': [' SUMMARY OF THE INVENTION An aspect of the present invention is to address at least the above-mentioned problems and/or disadvantages and to provide at least the advantages described below. Accordingly, an aspect of the present invention is to provide a compact optical network terminal, comprising a first interface coupled to a communications network, a second interface coupled to a network client and a processor including a circuitry and a memory coupled to the first interface and to the second interface, wherein the processor is capable of converting optical signals to electric signals, such that the network client can access the communications network. 
Other aspects, advantages, and salient features of the invention will become apparent to those skilled in the art from the following detailed description, which, taken in conjunction with the annexed drawings, discloses exemplary embodiments of the invention.'],\n", " 'description': [\"FIELD OF THE INVENTION The present invention relates to the field of passive optical network (PON), and in particular, to an optical network terminal (ONT) in the PON system. BACKGROUND OF THE INVENTION A network interface device permits a subscriber to access a network. A passive optical network (PON) is an example of a network capable of delivering voice, video and other data among multiple network subscribers, using a common optical fiber link. Passive optical splitters and combiners enable multiple optical network terminals (ONTs) to share the optical fiber link. In a PON, each ONT terminates the optical fiber link for a residential or business subscriber, and is sometimes referred to as a subscriber premises node that delivers Fiber to the Premises (FTTP) services. An ONT is connected to one or more subscriber devices, such as televisions, set-top boxes, telephones, computers, or network appliances, which ultimately receive the voice, video and data delivered vii the PON. An ONT is an example of a network interface, device. Other examples of a network interface device, in different network types, include cable modems and digital subscriber line (DSL) boxes. Generally, a network also includes a network access interface. In a PON, the network access interface is sometimes referred to as an optical line terminator (OLT), having multiple, independent PON interface modules that serve multiple optical fiber links. A PON interface module provides an interface for transmission and reception of data packets over a particular optical fiber link that serves a group of ONTs. A PON is a downstream-multicast medium. 
Each packet transmitted on an optical fiber link can be received by every ONT served by that link. ONTs identify selected packets or frames on the fiber link based on addressing information included within the packets or frames. Network equipment, such as network interface devices, in a cable or hybrid network may be connected to power provided by a central office (CO), which commonly utilizes battery and generator back-up power to maintain a continuous power supply. In contrast, an ONT in an all-fiber optic network is ordinarily powered locally at the subscriber premises. For this reason, an ONT often includes a battery to provide backup power during a power outage to maintain critical services, such as voice service. Conventionally, the fibre of a PON typically terminates at a street cabinet to be shared by a number of subscriber equipment. The street cabinet houses an optical network terminal (ONT). The last few meters or kilometer from the street cabinet to a subscriber's home is typically bridged using existing twisted pair copper cables or radio links. The bandwidth resources of the fibre to the street cabinet are typically shared amongst a group of subscribers using an Ethernet switch. For example the fibre may extend to a street cabinet, a kerb outside a subscribers home, or directly into the subscribers home itself. Due to the bulkiness, size and complexity of the ONT cabinets are all factors that increase design difficulty and accrue additional costs. Also, the ONT itself is valuable, and its mounting on a wall, especially outside, makes it susceptible to theft or to being accidentally knocked down. Therefore, it would be desirable to have a compact optical network terminal to make passive optical networks seamlessly connected to regular computers and any other systems to overcome the above restrictions. 
SUMMARY OF THE INVENTION An aspect of the present invention is to address at least the above-mentioned problems and/or disadvantages and to provide at least the advantages described below. Accordingly, an aspect of the present invention is to provide a compact optical network terminal, comprising a first interface coupled to a communications network, a second interface coupled to a network client and a processor including a circuitry and a memory coupled to the first interface and to the second interface, wherein the processor is capable of converting optical signals to electric signals, such that the network client can access the communications network. Other aspects, advantages, and salient features of the invention will become apparent to those skilled in the art from the following detailed description, which, taken in conjunction with the annexed drawings, discloses exemplary embodiments of the invention. BRIEF DESCRIPTION OF THE DRAWINGS The above and other aspects, features, and advantages of certain exemplary embodiments of the present invention will be more apparent from the following description taken in conjunction with the accompanying drawings in which: FIG. 1A is a mechanical diagram of an optical network terminal (ONT) typical of customer premises equipment (CPE). FIG. 1B is a mechanical diagram of the ONT of FIG. 1A attached to a mounting bracket. FIG. 2 shows a typical Passive Optical Network (PON) Architecture. FIG. 3 shows a compatible optical network terminal (ONT) according to one embodiment of the present invention. FIG. 4 is a diagrammatic system view of a data processing system in which any of the embodiments disclosed herein may be performed. Persons skilled in the art will appreciate that elements in the figures are illustrated for simplicity and clarity and may have not been drawn to scale. 
For example, the dimensions of some of the elements in the figure may be exaggerated relative to other elements to help to improve understanding of various exemplary embodiments of the present disclosure. Throughout the drawings, it should be noted that like reference numbers are used to depict the same or similar elements, features, and structures. DETAIL DESCRIPTION OF THE INVENTION The following description with reference to the accompanying drawings is provided to assist in a comprehensive understanding of exemplary embodiments of the invention as defined by the claims and their equivalents. It includes various specific details to assist in that understanding but′ these are to be regarded as merely exemplary. Accordingly, those of ordinary skill in the art will recognize that various changes and modifications of the embodiments described herein can be made without departing from the scope and spirit of the invention. In addition, descriptions of well-known functions and constructions are omitted for clarity and conciseness. The terms and words used in the following description and claims are not limited to the bibliographical meanings, but, are merely used by the inventor to enable a clear and consistent understanding of the invention. Accordingly, it should be apparent to those skilled in the art that the following description of exemplary embodiments of the present invention are provided for illustration purpose only and not for the purpose of limiting the invention as defined by the appended claims and their equivalents. It is to be understood that the singular forms “a,” “an,” and “the” include plural referents unless the context clearly dictates otherwise. Thus, for example, reference to “a component surface” includes reference to one or more of such surfaces. 
By the term “substantially” it is meant that the recited characteristic, parameter, or value need not be achieved exactly, but that deviations or variations, including for example, tolerances, measurement error, measurement accuracy limitations and other factors known to those of skill in the art, may occur in amounts that do not preclude the effect the characteristic was intended to provide. FIGS. 1 through 4, discussed below, and the various embodiments used to describe the principles of the present disclosure in this patent document are by way of illustration only and should not be construed in any way that would limit the scope of the disclosure. Those skilled in the art will understand that the principles of the present disclosure may be implemented in any suitably arranged communications system. The terms used to describe various embodiments are exemplary. It should be understood that these are provided to merely aid the understanding of the description, and that their use and definitions in no way limit the scope of the invention. Terms first, second, and the like are used to differentiate between objects having the same terminology and are in no way intended to represent a chronological order, unless where explicitly stated otherwise. A set is defined as a non-empty set including at least one element. FIG. 1A shows an optical network terminal (ONT) 100, which is an example of customer premises equipment (CPE), that connects a customer's communications equipment, e.g., computers, telephones, and televisions, to a telecommunications service provider. The ONT 100 includes an outer case 102 with an engagable cover 104 that covers a battery compartment (not shown) or another cavity of the ONT 100. A face 106 of the ONT 100 carries various connectors, including a power connector 108, coaxial cable connector 110, fiber optic cable connector 112, Ethernet (CAT-5) connector 114, and two telephone connectors 116. 
The ONT 100 transmits data to and receives data from a telecommunications network (not shown) via a fiber optic cable (not shown) connected to a fiber optic cable connector 112. Televisions, computers, and telephones on the customer's premises may be connected to the coaxial cable connector 110, Ethernet connector 114, and telephone connectors 116, respectively, on the ONT 100. FIG. 1B shows the ONT 100 of FIG. 1A with connector details with a bracket 120 attached to the outer case 102. The bracket 120 may be mounted to a wall (not shown), and the ONT 100 may be hung on the bracket. In many applications, the bracket 120 is installed on an exterior wall of a building or inside a garage, locations at which the ONT may be exposed to large temperature variations and different weather conditions. FIG. 2 shows a general Passive Optical Network (PON) Architecture. The elements of a PON are (i) Optical Line Terminal (OLT) 210 (ii) Passive Optical Splitter 220 and (iii) Optical Network Unit (ONU) 230. The Optical Line Terminal 210 is the main element of the network and is usually placed in the Local Exchange. It is a network element with PON line card, basically a aggregation switch. It works as an interface between core network and PON network. Optical Splitter 220 is a passive device with single input and multiple outputs. Optical power at input is split evenly between outputs. Not only signal travels from input to the outputs, signal can also travel from the output to the input. Splitters can be placed anywhere in between Central Office (CO) and Subscriber premises. It is used to connect an optical port of OLT with multiple subscribers. Optical Network units (ONUs) 230 serve as an interface to the network and are deployed at customer premises 240. It provides several interfaces for accessing triple play services and in the upper side it connects with the OLT via optical splitter. 
Although PONs can exist in three basic configuration (tree, bus and ring), the tree topology is favored due to smaller variation in the signal power from different end station. PON uses 1490 nm for the downstream wavelength and 1310 nm for the upstream wavelength. Signals are inserted or extracted from the fibre using a coarse wavelength division multiplexer (CWDM) filter at the CO and subscriber premises. FIG. 3 shows a compatible optical network terminal (ONT) according to one embodiment of the present invention. The optical network terminal (ONT) 300 includes a first interface 310, a second interface 320 and a middle region 330 sandwiched between the first and second interface. The first interface 310 coupled to a communications network 340, a second interface 320 coupled to a network client 350. The first interface is connected through a dedicated optical fiber link 360 (bi-directional) to receive optical signals from one or more communication network 340. The communication network may be or may include one or more but not limited to any of the xPON network 340 (e.g. of a broadband passive optical network (BPON), a gigabit-capable passive optical network (GPON), an Ethernet passive optical network (EPON), a gigabit-capable Ethernet passive optical network (GEPON), an active Ethernet optical network and any other future passive optical networks etc). The second interface 320 is coupled to the network client 350 though a USB port. In an operation, the middle region which may be a processor 330 including a memory (not shown in figure) coupled to the first interface 310 and to the second interface 320, wherein the processor 330 includes a circuitry which is configured for converting optical signals to electric signals, such that the network client can access the communications network. 
The first interface 310 may include an optical module (not shown in figure) which receives optical signals via the optical fiber link 360 and capable of converting the optical signals to electrical signals. The second interface 320 may include a control circuit (not shown in figure) which is capable of receiving the power from the network client 350 for processing the received electrical signals thereby reducing the required protocol processing time from the network client. Due to this behavior of the second interface 320 results in simplifying the ONT design by offloading the “non-volatile” part of the software to the network client 350 and downloading it on power to turn it. Most of the backend work can also be done by a software driver residing in the network client. Further, the second interface 320 acts as a network connectivity dongle with an optical transceiver at one end. Furthermore, the second interface may include a Universal Serial Bus (USB) jack which is couplable to Universal Serial Bus (USB) plug or connector of the network client 350. The second interface 320 capable of power up the “dongle” to connect it to the central office or Optical Line Terminal (OLT) by excluding external power source as required in the conventional design of ONT. In an example operation the Optical Network Terminal. (ONT) is connected to the network client through a USB port. Once the USB port of the network client 360 is coupled to the USB interface i.e. second interface 320, one or more driver needs to be installed at the network client 360 which then onwards controls the USB dongle (ONT) with the configured parameters at the installation time. The software boots up the USB dongle and communicates to network client 360 as a memory device with a built-in driver. The xPON protocol selected at the network client 360 will run and then converts the data coming from the WAN/LAN side to network client 360 as a network device. 
Once the software starts running in the network client 360, it would get connected to the OLT using the required xPON protocol. Once the network client 360 and the xPON network are connected, each network client 360 will have a dedicated connection (e.g. speed, bandwidth etc) as requested or selected by the client side. By this kind of novel and compatible design i.e. having xPON interface on one side and USB protocol interface on the other side will eradicate the necessity of the external power for the ONT. Also, by this kind of compatible design reduce the unnecessary splitting of equal upstream wavelength to all the network clients in the network. The network client may be or may include a host computer, a optical network unit, a optical network terminal or any other unit or terminal or device which is capable of accessing the passive optical network (xPON). FIG. 4 is a diagrammatic system view 400 of a data processing system in which any of the embodiments disclosed herein may be performed, according to one embodiment. Particularly, the diagrammatic system view of FIG. 4 illustrates a processor 402, a main memory 404, a static memory 406, a bus 408, a video display 410, an alpha-numeric input device 412, a cursor control device 414, a drive unit 416, a signal generation device 418, a network interface device 420, a machine readable medium 422, instructions 424 and a network 426. The diagrammatic system view 400 may indicate a personal computer and/or a data processing system in which one or more operations disclosed herein are performed. The processor 402 may be a microprocessor, a state machine, an application specific integrated circuit, a field programmable gate array; etc. (e.g., Intel® Pentium® processor). The main memory 404 may be a dynamic random access memory and/or a primary memory of a computer system. The static memory 406 may be a hard drive, a flash drive, and/or other memory information associated with the data processing system. 
The bus 408 may be an interconnection between various circuits and/or structures of the data processing system. The video display 410 may provide graphical representation of information on the data processing system. The alpha-numeric input device 412 may be a keypad, keyboard and/or any other input device of text (e.g., a special device to aid the physically handicapped). The cursor control device 414 may be a pointing device such as a mouse. The drive unit 416 may be a hard drive, a storage system, and/or other longer term storage subsystem. The signal generation device 418 may be a bios and/or a functional operating system of the data processing system. The network interface device 420 may perform interface functions (e.g., code conversion, protocol conversion, and/or buffering) required for communications to and from the network 426 between a number of independent devices (e.g., of varying protocols). The machine readable medium 422 may provide instructions on which any of the methods disclosed herein may be performed. The instructions 424 may provide source code and/or data code to the processor 402 to enable any one/or more operations disclosed herein. FIGS. 1-4 are merely representational and are not drawn to scale. Certain portions thereof may be exaggerated, while others may be minimized. FIGS. 1-4 illustrate various embodiments of the invention that can be understood and appropriately carried out by those of ordinary skill in the art. In the foregoing detailed description of embodiments of the invention, various features are grouped together in a single embodiment for the purpose of streamlining the disclosure. This method of disclosure is not to be interpreted as reflecting an intention that the claimed embodiments of the invention require more features than are expressly recited in each claim. Rather, as the following claims reflect, inventive subject matter lies in less than all features of a single disclosed embodiment. 
Thus, the following claims are hereby incorporated into the detailed description of embodiments of the invention, with each claim standing on its own as a separate embodiment. It is understood that the above description is intended to be illustrative, and not restrictive. It is intended to cover all alternatives, modifications and equivalents as may be included within the spirit and scope of the invention as defined in the appended claims. Many other embodiments will be apparent to those of skill in the art upon reviewing the above description. The scope of the invention should, therefore, be determined with reference to the appended claims, along with the full scope of equivalents to which such claims are entitled. In the appended claims, the terms “including” and “in which” are used as the plain-English equivalents of the respective terms “comprising” and “wherein,” respectively.\"],\n", " 'cpc_label': ['H04Q110071'],\n", " 'ipc_label': ['H04Q1100'],\n", " 'filing_date': ['20160120'],\n", " 'patent_issue_date': ['20170606'],\n", " 'date_published': ['20160526'],\n", " 'examiner_id': ['95191.0']}" ] }, "metadata": {}, "execution_count": 10 } ] }, { "cell_type": "code", "source": [ "train_dict[0]['claims']" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 140 }, "id": "jDBvcgmP5Puh", "outputId": "f4f73693-11f7-4918-a86d-2912e863b151" }, "execution_count": 11, "outputs": [ { "output_type": "execute_result", "data": { "text/plain": [ "'1. 
A compact optical network terminal, comprising: a first interface coupled to a communications network; a second interface coupled to a network client, wherein the second interface is a network connectivity dongle with an optical transceiver at one end; and a processor including a circuitry and a memory coupled to the first interface and to the second interface, wherein the processor is capable of converting optical signals to electric signals, such that the network client can access the communications network thereby reducing the unnecessary splitting of equal upstream wavelengths to all the network clients in the network. 2. The optical network terminal of claim 1, wherein the first interface includes an optical module that receives optical signals via the optical fiber link and converts the optical signals to electrical signals. 3. The optical network terminal of claim 2, wherein the optical module is selectively configurable to support two or more of a broadband passive optical network (BPON), a gigabit-capable passive optical network (GPON), an Ethernet passive optical network (EPON), a gigabit-capable Ethernet passive optical network (GEPON) and an active Ethernet optical network. 4. The optical network terminal of claim 1, wherein the network client includes a converter unit for converting at least some of the electrical signals to data units which is selectively configurable to support a plurality of optical network protocols. 5. The optical, network terminal of claim 1, wherein the second interface includes a control circuitry which is capable of receiving the power from the network client for processing the received electrical signals thereby reducing the required protocol processing time from the network client. 6. The optical network terminal of claim 1, wherein the network client is capable of processing the xPON protocols to communicate with one or more Optical Line Terminal (OLT). 7. (canceled) 8. 
The optical network terminal of claim 1, wherein the second interface includes a Universal Serial Bus (USB) jack which is couplable to Universal Serial Bus (USB) plug or connector of the network client. 9. The optical network terminal of claim 1, wherein the at least one communication service with the xPON network comprises a first communication service and a second communication service, and wherein the communication service includes at least one voice communication service, a data communication service, and a video service. 10. (canceled)'" ], "application/vnd.google.colaboratory.intrinsic+json": { "type": "string" } }, "metadata": {}, "execution_count": 11 } ] }, { "cell_type": "code", "source": [ "train_dict[0]['abstract']" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 87 }, "id": "sBhSPSV-5XKS", "outputId": "0057e051-3b36-4705-8636-19e7850fa0a9" }, "execution_count": 12, "outputs": [ { "output_type": "execute_result", "data": { "text/plain": [ "'The present invention relates to passive optical network (PON), and in particular, to an optical network terminal (ONT) in the PON system. 
In one embodiment, the optical network terminal includes a first interface coupled to a communications network, a second interface coupled to a network client and a processor including a memory coupled to the first interface and to the second interface, wherein the processor is capable of converting optical signals to electric signals, such that the network client can access the communications network.'" ], "application/vnd.google.colaboratory.intrinsic+json": { "type": "string" } }, "metadata": {}, "execution_count": 12 } ] }, { "cell_type": "code", "source": [ "# Print info about the sizes of the train and validation sets\n", "print(f'Train dataset size: {dataset_dict[\"train\"].shape}')\n", "print(f'Validation dataset size: {dataset_dict[\"validation\"].shape}')" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "_737fP8byR80", "outputId": "682c7b64-bd44-4a77-f43c-3e498a4b88df" }, "execution_count": 13, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "Train dataset size: (16153, 14)\n", "Validation dataset size: (9094, 14)\n" ] } ] }, { "cell_type": "markdown", "source": [ "## Pre-Processing the data" ], "metadata": { "id": "vsDHmJOQyaJo" } }, { "cell_type": "markdown", "source": [ "Define the label-to-index mapping for the decision status field by assigning each decision status label a class index."
], "metadata": { "id": "Ir63W-lwyjIE" } }, { "cell_type": "code", "source": [ "# Label-to-index mapping for the decision status field\n", "decision_to_str = {'REJECTED': 0, 'ACCEPTED': 1, 'PENDING': 2, 'CONT-REJECTED': 3, 'CONT-ACCEPTED': 4, 'CONT-PENDING': 5}\n", "\n", "# Helper passed to .map(): looks up the example's decision label and returns its class index under the 'decision' key\n", "def map_decision_to_string(example):\n", " return {'decision': decision_to_str[example['decision']]}" ], "metadata": { "id": "tmyPz1nRyZoG" }, "execution_count": 14, "outputs": [] }, { "cell_type": "markdown", "source": [ "Re-label the decision status fields of the examples in the training and validation sets." ], "metadata": { "id": "3fN3dJrzypqJ" } }, { "cell_type": "code", "source": [ "# Re-labeling/mapping.\n", "train_set = dataset_dict['train'].map(map_decision_to_string)\n", "val_set = dataset_dict['validation'].map(map_decision_to_string)" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "7uH1FRQVyqf6", "outputId": "d887f592-86df-4576-b554-ea5ac60335ce" }, "execution_count": 15, "outputs": [ { "output_type": "stream", "name": "stderr", "text": [ "WARNING:datasets.arrow_dataset:Loading cached processed dataset at /root/.cache/huggingface/datasets/HUPD___hupd/sample-bf35d7d92b870122/0.0.0/6920d2def8fd7767046c0470603357f76866e5a09c97e19571896bfdca521142/cache-078dcfeb0f74c43d.arrow\n", "WARNING:datasets.arrow_dataset:Loading cached processed dataset at /root/.cache/huggingface/datasets/HUPD___hupd/sample-bf35d7d92b870122/0.0.0/6920d2def8fd7767046c0470603357f76866e5a09c97e19571896bfdca521142/cache-77ddc42467355d18.arrow\n" ] } ] }, { "cell_type": "code", "source": [ "# Sanity check: inspect the first re-labeled training example\n", "train_set[:1]" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "KEhTJpFj117_", "outputId": "d3ae3ec6-7235-4e0a-a668-24df06ba65d7" }, "execution_count": 16, "outputs": [ { "output_type": "execute_result", "data": { "text/plain": [ "{'patent_number': ['13261748'],\n", " 'decision': [1],\n", " 'title': ['MINI-OPTICAL NETWORK TERMINAL (ONT)'],\n", 
" 'abstract': ['The present invention relates to passive optical network (PON), and in particular, to an optical network terminal (ONT) in the PON system. In one embodiment, the optical network terminal includes a first interface coupled to a communications network, a second interface coupled to a network client and a processor including a memory coupled to the first interface and to the second interface, wherein the processor is capable of converting optical signals to electric signals, such that the network client can access the communications network.'],\n", " 'claims': ['1. A compact optical network terminal, comprising: a first interface coupled to a communications network; a second interface coupled to a network client, wherein the second interface is a network connectivity dongle with an optical transceiver at one end; and a processor including a circuitry and a memory coupled to the first interface and to the second interface, wherein the processor is capable of converting optical signals to electric signals, such that the network client can access the communications network thereby reducing the unnecessary splitting of equal upstream wavelengths to all the network clients in the network. 2. The optical network terminal of claim 1, wherein the first interface includes an optical module that receives optical signals via the optical fiber link and converts the optical signals to electrical signals. 3. The optical network terminal of claim 2, wherein the optical module is selectively configurable to support two or more of a broadband passive optical network (BPON), a gigabit-capable passive optical network (GPON), an Ethernet passive optical network (EPON), a gigabit-capable Ethernet passive optical network (GEPON) and an active Ethernet optical network. 4. 
The optical network terminal of claim 1, wherein the network client includes a converter unit for converting at least some of the electrical signals to data units which is selectively configurable to support a plurality of optical network protocols. 5. The optical, network terminal of claim 1, wherein the second interface includes a control circuitry which is capable of receiving the power from the network client for processing the received electrical signals thereby reducing the required protocol processing time from the network client. 6. The optical network terminal of claim 1, wherein the network client is capable of processing the xPON protocols to communicate with one or more Optical Line Terminal (OLT). 7. (canceled) 8. The optical network terminal of claim 1, wherein the second interface includes a Universal Serial Bus (USB) jack which is couplable to Universal Serial Bus (USB) plug or connector of the network client. 9. The optical network terminal of claim 1, wherein the at least one communication service with the xPON network comprises a first communication service and a second communication service, and wherein the communication service includes at least one voice communication service, a data communication service, and a video service. 10. (canceled)'],\n", " 'background': [\" BACKGROUND OF THE INVENTION A network interface device permits a subscriber to access a network. A passive optical network (PON) is an example of a network capable of delivering voice, video and other data among multiple network subscribers, using a common optical fiber link. Passive optical splitters and combiners enable multiple optical network terminals (ONTs) to share the optical fiber link. In a PON, each ONT terminates the optical fiber link for a residential or business subscriber, and is sometimes referred to as a subscriber premises node that delivers Fiber to the Premises (FTTP) services. 
An ONT is connected to one or more subscriber devices, such as televisions, set-top boxes, telephones, computers, or network appliances, which ultimately receive the voice, video and data delivered vii the PON. An ONT is an example of a network interface, device. Other examples of a network interface device, in different network types, include cable modems and digital subscriber line (DSL) boxes. Generally, a network also includes a network access interface. In a PON, the network access interface is sometimes referred to as an optical line terminator (OLT), having multiple, independent PON interface modules that serve multiple optical fiber links. A PON interface module provides an interface for transmission and reception of data packets over a particular optical fiber link that serves a group of ONTs. A PON is a downstream-multicast medium. Each packet transmitted on an optical fiber link can be received by every ONT served by that link. ONTs identify selected packets or frames on the fiber link based on addressing information included within the packets or frames. Network equipment, such as network interface devices, in a cable or hybrid network may be connected to power provided by a central office (CO), which commonly utilizes battery and generator back-up power to maintain a continuous power supply. In contrast, an ONT in an all-fiber optic network is ordinarily powered locally at the subscriber premises. For this reason, an ONT often includes a battery to provide backup power during a power outage to maintain critical services, such as voice service. Conventionally, the fibre of a PON typically terminates at a street cabinet to be shared by a number of subscriber equipment. The street cabinet houses an optical network terminal (ONT). The last few meters or kilometer from the street cabinet to a subscriber's home is typically bridged using existing twisted pair copper cables or radio links. 
The bandwidth resources of the fibre to the street cabinet are typically shared amongst a group of subscribers using an Ethernet switch. For example the fibre may extend to a street cabinet, a kerb outside a subscribers home, or directly into the subscribers home itself. Due to the bulkiness, size and complexity of the ONT cabinets are all factors that increase design difficulty and accrue additional costs. Also, the ONT itself is valuable, and its mounting on a wall, especially outside, makes it susceptible to theft or to being accidentally knocked down. Therefore, it would be desirable to have a compact optical network terminal to make passive optical networks seamlessly connected to regular computers and any other systems to overcome the above restrictions.\"],\n", " 'summary': [' SUMMARY OF THE INVENTION An aspect of the present invention is to address at least the above-mentioned problems and/or disadvantages and to provide at least the advantages described below. Accordingly, an aspect of the present invention is to provide a compact optical network terminal, comprising a first interface coupled to a communications network, a second interface coupled to a network client and a processor including a circuitry and a memory coupled to the first interface and to the second interface, wherein the processor is capable of converting optical signals to electric signals, such that the network client can access the communications network. Other aspects, advantages, and salient features of the invention will become apparent to those skilled in the art from the following detailed description, which, taken in conjunction with the annexed drawings, discloses exemplary embodiments of the invention.'],\n", " 'description': [\"FIELD OF THE INVENTION The present invention relates to the field of passive optical network (PON), and in particular, to an optical network terminal (ONT) in the PON system. 
BACKGROUND OF THE INVENTION A network interface device permits a subscriber to access a network. A passive optical network (PON) is an example of a network capable of delivering voice, video and other data among multiple network subscribers, using a common optical fiber link. Passive optical splitters and combiners enable multiple optical network terminals (ONTs) to share the optical fiber link. In a PON, each ONT terminates the optical fiber link for a residential or business subscriber, and is sometimes referred to as a subscriber premises node that delivers Fiber to the Premises (FTTP) services. An ONT is connected to one or more subscriber devices, such as televisions, set-top boxes, telephones, computers, or network appliances, which ultimately receive the voice, video and data delivered vii the PON. An ONT is an example of a network interface, device. Other examples of a network interface device, in different network types, include cable modems and digital subscriber line (DSL) boxes. Generally, a network also includes a network access interface. In a PON, the network access interface is sometimes referred to as an optical line terminator (OLT), having multiple, independent PON interface modules that serve multiple optical fiber links. A PON interface module provides an interface for transmission and reception of data packets over a particular optical fiber link that serves a group of ONTs. A PON is a downstream-multicast medium. Each packet transmitted on an optical fiber link can be received by every ONT served by that link. ONTs identify selected packets or frames on the fiber link based on addressing information included within the packets or frames. Network equipment, such as network interface devices, in a cable or hybrid network may be connected to power provided by a central office (CO), which commonly utilizes battery and generator back-up power to maintain a continuous power supply. 
In contrast, an ONT in an all-fiber optic network is ordinarily powered locally at the subscriber premises. For this reason, an ONT often includes a battery to provide backup power during a power outage to maintain critical services, such as voice service. Conventionally, the fibre of a PON typically terminates at a street cabinet to be shared by a number of subscriber equipment. The street cabinet houses an optical network terminal (ONT). The last few meters or kilometer from the street cabinet to a subscriber's home is typically bridged using existing twisted pair copper cables or radio links. The bandwidth resources of the fibre to the street cabinet are typically shared amongst a group of subscribers using an Ethernet switch. For example the fibre may extend to a street cabinet, a kerb outside a subscribers home, or directly into the subscribers home itself. Due to the bulkiness, size and complexity of the ONT cabinets are all factors that increase design difficulty and accrue additional costs. Also, the ONT itself is valuable, and its mounting on a wall, especially outside, makes it susceptible to theft or to being accidentally knocked down. Therefore, it would be desirable to have a compact optical network terminal to make passive optical networks seamlessly connected to regular computers and any other systems to overcome the above restrictions. SUMMARY OF THE INVENTION An aspect of the present invention is to address at least the above-mentioned problems and/or disadvantages and to provide at least the advantages described below. 
Accordingly, an aspect of the present invention is to provide a compact optical network terminal, comprising a first interface coupled to a communications network, a second interface coupled to a network client and a processor including a circuitry and a memory coupled to the first interface and to the second interface, wherein the processor is capable of converting optical signals to electric signals, such that the network client can access the communications network. Other aspects, advantages, and salient features of the invention will become apparent to those skilled in the art from the following detailed description, which, taken in conjunction with the annexed drawings, discloses exemplary embodiments of the invention. BRIEF DESCRIPTION OF THE DRAWINGS The above and other aspects, features, and advantages of certain exemplary embodiments of the present invention will be more apparent from the following description taken in conjunction with the accompanying drawings in which: FIG. 1A is a mechanical diagram of an optical network terminal (ONT) typical of customer premises equipment (CPE). FIG. 1B is a mechanical diagram of the ONT of FIG. 1A attached to a mounting bracket. FIG. 2 shows a typical Passive Optical Network (PON) Architecture. FIG. 3 shows a compatible optical network terminal (ONT) according to one embodiment of the present invention. FIG. 4 is a diagrammatic system view of a data processing system in which any of the embodiments disclosed herein may be performed. Persons skilled in the art will appreciate that elements in the figures are illustrated for simplicity and clarity and may have not been drawn to scale. For example, the dimensions of some of the elements in the figure may be exaggerated relative to other elements to help to improve understanding of various exemplary embodiments of the present disclosure. 
Throughout the drawings, it should be noted that like reference numbers are used to depict the same or similar elements, features, and structures. DETAIL DESCRIPTION OF THE INVENTION The following description with reference to the accompanying drawings is provided to assist in a comprehensive understanding of exemplary embodiments of the invention as defined by the claims and their equivalents. It includes various specific details to assist in that understanding but′ these are to be regarded as merely exemplary. Accordingly, those of ordinary skill in the art will recognize that various changes and modifications of the embodiments described herein can be made without departing from the scope and spirit of the invention. In addition, descriptions of well-known functions and constructions are omitted for clarity and conciseness. The terms and words used in the following description and claims are not limited to the bibliographical meanings, but, are merely used by the inventor to enable a clear and consistent understanding of the invention. Accordingly, it should be apparent to those skilled in the art that the following description of exemplary embodiments of the present invention are provided for illustration purpose only and not for the purpose of limiting the invention as defined by the appended claims and their equivalents. It is to be understood that the singular forms “a,” “an,” and “the” include plural referents unless the context clearly dictates otherwise. Thus, for example, reference to “a component surface” includes reference to one or more of such surfaces. By the term “substantially” it is meant that the recited characteristic, parameter, or value need not be achieved exactly, but that deviations or variations, including for example, tolerances, measurement error, measurement accuracy limitations and other factors known to those of skill in the art, may occur in amounts that do not preclude the effect the characteristic was intended to provide. FIGS. 
1 through 4, discussed below, and the various embodiments used to describe the principles of the present disclosure in this patent document are by way of illustration only and should not be construed in any way that would limit the scope of the disclosure. Those skilled in the art will understand that the principles of the present disclosure may be implemented in any suitably arranged communications system. The terms used to describe various embodiments are exemplary. It should be understood that these are provided to merely aid the understanding of the description, and that their use and definitions in no way limit the scope of the invention. Terms first, second, and the like are used to differentiate between objects having the same terminology and are in no way intended to represent a chronological order, unless where explicitly stated otherwise. A set is defined as a non-empty set including at least one element. FIG. 1A shows an optical network terminal (ONT) 100, which is an example of customer premises equipment (CPE), that connects a customer's communications equipment, e.g., computers, telephones, and televisions, to a telecommunications service provider. The ONT 100 includes an outer case 102 with an engagable cover 104 that covers a battery compartment (not shown) or another cavity of the ONT 100. A face 106 of the ONT 100 carries various connectors, including a power connector 108, coaxial cable connector 110, fiber optic cable connector 112, Ethernet (CAT-5) connector 114, and two telephone connectors 116. The ONT 100 transmits data to and receives data from a telecommunications network (not shown) via a fiber optic cable (not shown) connected to a fiber optic cable connector 112. Televisions, computers, and telephones on the customer's premises may be connected to the coaxial cable connector 110, Ethernet connector 114, and telephone connectors 116, respectively, on the ONT 100. FIG. 1B shows the ONT 100 of FIG. 
1A with connector details with a bracket 120 attached to the outer case 102. The bracket 120 may be mounted to a wall (not shown), and the ONT 100 may be hung on the bracket. In many applications, the bracket 120 is installed on an exterior wall of a building or inside a garage, locations at which the ONT may be exposed to large temperature variations and different weather conditions. FIG. 2 shows a general Passive Optical Network (PON) Architecture. The elements of a PON are (i) Optical Line Terminal (OLT) 210 (ii) Passive Optical Splitter 220 and (iii) Optical Network Unit (ONU) 230. The Optical Line Terminal 210 is the main element of the network and is usually placed in the Local Exchange. It is a network element with PON line card, basically a aggregation switch. It works as an interface between core network and PON network. Optical Splitter 220 is a passive device with single input and multiple outputs. Optical power at input is split evenly between outputs. Not only signal travels from input to the outputs, signal can also travel from the output to the input. Splitters can be placed anywhere in between Central Office (CO) and Subscriber premises. It is used to connect an optical port of OLT with multiple subscribers. Optical Network units (ONUs) 230 serve as an interface to the network and are deployed at customer premises 240. It provides several interfaces for accessing triple play services and in the upper side it connects with the OLT via optical splitter. Although PONs can exist in three basic configuration (tree, bus and ring), the tree topology is favored due to smaller variation in the signal power from different end station. PON uses 1490 nm for the downstream wavelength and 1310 nm for the upstream wavelength. Signals are inserted or extracted from the fibre using a coarse wavelength division multiplexer (CWDM) filter at the CO and subscriber premises. FIG. 
3 shows a compatible optical network terminal (ONT) according to one embodiment of the present invention. The optical network terminal (ONT) 300 includes a first interface 310, a second interface 320 and a middle region 330 sandwiched between the first and second interface. The first interface 310 coupled to a communications network 340, a second interface 320 coupled to a network client 350. The first interface is connected through a dedicated optical fiber link 360 (bi-directional) to receive optical signals from one or more communication network 340. The communication network may be or may include one or more but not limited to any of the xPON network 340 (e.g. of a broadband passive optical network (BPON), a gigabit-capable passive optical network (GPON), an Ethernet passive optical network (EPON), a gigabit-capable Ethernet passive optical network (GEPON), an active Ethernet optical network and any other future passive optical networks etc). The second interface 320 is coupled to the network client 350 though a USB port. In an operation, the middle region which may be a processor 330 including a memory (not shown in figure) coupled to the first interface 310 and to the second interface 320, wherein the processor 330 includes a circuitry which is configured for converting optical signals to electric signals, such that the network client can access the communications network. The first interface 310 may include an optical module (not shown in figure) which receives optical signals via the optical fiber link 360 and capable of converting the optical signals to electrical signals. The second interface 320 may include a control circuit (not shown in figure) which is capable of receiving the power from the network client 350 for processing the received electrical signals thereby reducing the required protocol processing time from the network client. 
Due to this behavior of the second interface 320 results in simplifying the ONT design by offloading the “non-volatile” part of the software to the network client 350 and downloading it on power to turn it. Most of the backend work can also be done by a software driver residing in the network client. Further, the second interface 320 acts as a network connectivity dongle with an optical transceiver at one end. Furthermore, the second interface may include a Universal Serial Bus (USB) jack which is couplable to Universal Serial Bus (USB) plug or connector of the network client 350. The second interface 320 capable of power up the “dongle” to connect it to the central office or Optical Line Terminal (OLT) by excluding external power source as required in the conventional design of ONT. In an example operation the Optical Network Terminal. (ONT) is connected to the network client through a USB port. Once the USB port of the network client 360 is coupled to the USB interface i.e. second interface 320, one or more driver needs to be installed at the network client 360 which then onwards controls the USB dongle (ONT) with the configured parameters at the installation time. The software boots up the USB dongle and communicates to network client 360 as a memory device with a built-in driver. The xPON protocol selected at the network client 360 will run and then converts the data coming from the WAN/LAN side to network client 360 as a network device. Once the software starts running in the network client 360, it would get connected to the OLT using the required xPON protocol. Once the network client 360 and the xPON network are connected, each network client 360 will have a dedicated connection (e.g. speed, bandwidth etc) as requested or selected by the client side. By this kind of novel and compatible design i.e. having xPON interface on one side and USB protocol interface on the other side will eradicate the necessity of the external power for the ONT. 
Also, by this kind of compatible design reduce the unnecessary splitting of equal upstream wavelength to all the network clients in the network. The network client may be or may include a host computer, a optical network unit, a optical network terminal or any other unit or terminal or device which is capable of accessing the passive optical network (xPON). FIG. 4 is a diagrammatic system view 400 of a data processing system in which any of the embodiments disclosed herein may be performed, according to one embodiment. Particularly, the diagrammatic system view of FIG. 4 illustrates a processor 402, a main memory 404, a static memory 406, a bus 408, a video display 410, an alpha-numeric input device 412, a cursor control device 414, a drive unit 416, a signal generation device 418, a network interface device 420, a machine readable medium 422, instructions 424 and a network 426. The diagrammatic system view 400 may indicate a personal computer and/or a data processing system in which one or more operations disclosed herein are performed. The processor 402 may be a microprocessor, a state machine, an application specific integrated circuit, a field programmable gate array; etc. (e.g., Intel® Pentium® processor). The main memory 404 may be a dynamic random access memory and/or a primary memory of a computer system. The static memory 406 may be a hard drive, a flash drive, and/or other memory information associated with the data processing system. The bus 408 may be an interconnection between various circuits and/or structures of the data processing system. The video display 410 may provide graphical representation of information on the data processing system. The alpha-numeric input device 412 may be a keypad, keyboard and/or any other input device of text (e.g., a special device to aid the physically handicapped). The cursor control device 414 may be a pointing device such as a mouse. 
The drive unit 416 may be a hard drive, a storage system, and/or other longer term storage subsystem. The signal generation device 418 may be a bios and/or a functional operating system of the data processing system. The network interface device 420 may perform interface functions (e.g., code conversion, protocol conversion, and/or buffering) required for communications to and from the network 426 between a number of independent devices (e.g., of varying protocols). The machine readable medium 422 may provide instructions on which any of the methods disclosed herein may be performed. The instructions 424 may provide source code and/or data code to the processor 402 to enable any one/or more operations disclosed herein. FIGS. 1-4 are merely representational and are not drawn to scale. Certain portions thereof may be exaggerated, while others may be minimized. FIGS. 1-4 illustrate various embodiments of the invention that can be understood and appropriately carried out by those of ordinary skill in the art. In the foregoing detailed description of embodiments of the invention, various features are grouped together in a single embodiment for the purpose of streamlining the disclosure. This method of disclosure is not to be interpreted as reflecting an intention that the claimed embodiments of the invention require more features than are expressly recited in each claim. Rather, as the following claims reflect, inventive subject matter lies in less than all features of a single disclosed embodiment. Thus, the following claims are hereby incorporated into the detailed description of embodiments of the invention, with each claim standing on its own as a separate embodiment. It is understood that the above description is intended to be illustrative, and not restrictive. It is intended to cover all alternatives, modifications and equivalents as may be included within the spirit and scope of the invention as defined in the appended claims. 
Many other embodiments will be apparent to those of skill in the art upon reviewing the above description. The scope of the invention should, therefore, be determined with reference to the appended claims, along with the full scope of equivalents to which such claims are entitled. In the appended claims, the terms “including” and “in which” are used as the plain-English equivalents of the respective terms “comprising” and “wherein,” respectively.\"],\n", " 'cpc_label': ['H04Q110071'],\n", " 'ipc_label': ['H04Q1100'],\n", " 'filing_date': ['20160120'],\n", " 'patent_issue_date': ['20170606'],\n", " 'date_published': ['20160526'],\n", " 'examiner_id': ['95191.0']}" ] }, "metadata": {}, "execution_count": 16 } ] },
{ "cell_type": "markdown", "source": [
"Tokenize the abstract section of the patent applications: `_SECTION_` names the field, and `tokenize_section` is the function applied to each split."
], "metadata": { "id": "0S8N1KyZy4Gg" } },
{ "cell_type": "code", "source": [
"# Field of each patent application whose text is passed to the tokenizer.\n",
"_SECTION_ = 'abstract'\n",
"\n",
"\n",
"def tokenize_section(batch):\n",
"    \"\"\"Tokenize the `_SECTION_` field of a batch of examples.\n",
"\n",
"    Shared by the training and validation cells so that both splits are\n",
"    tokenized with exactly the same settings.\n",
"\n",
"    Args:\n",
"        batch: the batch handed over by `.map(..., batched=True)`;\n",
"            `batch[_SECTION_]` is passed to `tokenizer` unchanged.\n",
"\n",
"    Returns:\n",
"        The result of `tokenizer(...)` called with truncation=True and\n",
"        padding='max_length'.\n",
"    \"\"\"\n",
"    return tokenizer(batch[_SECTION_], truncation=True, padding='max_length')"
], "metadata": { "id": "DSQTi4POy31s" }, "execution_count": 17, "outputs": [] },
{ "cell_type": "code", "source": [
"# Training set\n",
"train_set = train_set.map(tokenize_section, batched=True)"
], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "wFNuWMLs0Kk7", "outputId": "2410867b-863b-4f6e-b02a-a7741f6fa679" }, "execution_count": 18, "outputs": [ { "output_type": "stream", "name": "stderr", "text": [ "WARNING:datasets.arrow_dataset:Loading cached processed dataset at /root/.cache/huggingface/datasets/HUPD___hupd/sample-bf35d7d92b870122/0.0.0/6920d2def8fd7767046c0470603357f76866e5a09c97e19571896bfdca521142/cache-42411569b48e4939.arrow\n" ] } ] },
{ "cell_type": "code", "source": [
"# Validation set\n",
"val_set = val_set.map(tokenize_section, batched=True)"
], "metadata": { "colab": { "base_uri": "https://localhost:8080/" },
"id": "DW9OGw-_0Qt5", "outputId": "edf94bac-8228-4658-9664-9b0f3b323089" }, "execution_count": 19, "outputs": [ { "output_type": "stream", "name": "stderr", "text": [ "WARNING:datasets.arrow_dataset:Loading cached processed dataset at /root/.cache/huggingface/datasets/HUPD___hupd/sample-bf35d7d92b870122/0.0.0/6920d2def8fd7767046c0470603357f76866e5a09c97e19571896bfdca521142/cache-c490cf51d00ce442.arrow\n" ] } ] }, { "cell_type": "code", "source": [ "train_set[:1]" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "dStdZuT15oiJ", "outputId": "76f29929-27af-4a37-d258-e510df7b63d1" }, "execution_count": 20, "outputs": [ { "output_type": "execute_result", "data": { "text/plain": [ "{'patent_number': ['13261748'],\n", " 'decision': [1],\n", " 'title': ['MINI-OPTICAL NETWORK TERMINAL (ONT)'],\n", " 'abstract': ['The present invention relates to passive optical network (PON), and in particular, to an optical network terminal (ONT) in the PON system. In one embodiment, the optical network terminal includes a first interface coupled to a communications network, a second interface coupled to a network client and a processor including a memory coupled to the first interface and to the second interface, wherein the processor is capable of converting optical signals to electric signals, such that the network client can access the communications network.'],\n", " 'claims': ['1. 
A compact optical network terminal, comprising: a first interface coupled to a communications network; a second interface coupled to a network client, wherein the second interface is a network connectivity dongle with an optical transceiver at one end; and a processor including a circuitry and a memory coupled to the first interface and to the second interface, wherein the processor is capable of converting optical signals to electric signals, such that the network client can access the communications network thereby reducing the unnecessary splitting of equal upstream wavelengths to all the network clients in the network. 2. The optical network terminal of claim 1, wherein the first interface includes an optical module that receives optical signals via the optical fiber link and converts the optical signals to electrical signals. 3. The optical network terminal of claim 2, wherein the optical module is selectively configurable to support two or more of a broadband passive optical network (BPON), a gigabit-capable passive optical network (GPON), an Ethernet passive optical network (EPON), a gigabit-capable Ethernet passive optical network (GEPON) and an active Ethernet optical network. 4. The optical network terminal of claim 1, wherein the network client includes a converter unit for converting at least some of the electrical signals to data units which is selectively configurable to support a plurality of optical network protocols. 5. The optical, network terminal of claim 1, wherein the second interface includes a control circuitry which is capable of receiving the power from the network client for processing the received electrical signals thereby reducing the required protocol processing time from the network client. 6. The optical network terminal of claim 1, wherein the network client is capable of processing the xPON protocols to communicate with one or more Optical Line Terminal (OLT). 7. (canceled) 8. 
The optical network terminal of claim 1, wherein the second interface includes a Universal Serial Bus (USB) jack which is couplable to Universal Serial Bus (USB) plug or connector of the network client. 9. The optical network terminal of claim 1, wherein the at least one communication service with the xPON network comprises a first communication service and a second communication service, and wherein the communication service includes at least one voice communication service, a data communication service, and a video service. 10. (canceled)'],\n", " 'background': [\" BACKGROUND OF THE INVENTION A network interface device permits a subscriber to access a network. A passive optical network (PON) is an example of a network capable of delivering voice, video and other data among multiple network subscribers, using a common optical fiber link. Passive optical splitters and combiners enable multiple optical network terminals (ONTs) to share the optical fiber link. In a PON, each ONT terminates the optical fiber link for a residential or business subscriber, and is sometimes referred to as a subscriber premises node that delivers Fiber to the Premises (FTTP) services. An ONT is connected to one or more subscriber devices, such as televisions, set-top boxes, telephones, computers, or network appliances, which ultimately receive the voice, video and data delivered vii the PON. An ONT is an example of a network interface, device. Other examples of a network interface device, in different network types, include cable modems and digital subscriber line (DSL) boxes. Generally, a network also includes a network access interface. In a PON, the network access interface is sometimes referred to as an optical line terminator (OLT), having multiple, independent PON interface modules that serve multiple optical fiber links. A PON interface module provides an interface for transmission and reception of data packets over a particular optical fiber link that serves a group of ONTs. 
A PON is a downstream-multicast medium. Each packet transmitted on an optical fiber link can be received by every ONT served by that link. ONTs identify selected packets or frames on the fiber link based on addressing information included within the packets or frames. Network equipment, such as network interface devices, in a cable or hybrid network may be connected to power provided by a central office (CO), which commonly utilizes battery and generator back-up power to maintain a continuous power supply. In contrast, an ONT in an all-fiber optic network is ordinarily powered locally at the subscriber premises. For this reason, an ONT often includes a battery to provide backup power during a power outage to maintain critical services, such as voice service. Conventionally, the fibre of a PON typically terminates at a street cabinet to be shared by a number of subscriber equipment. The street cabinet houses an optical network terminal (ONT). The last few meters or kilometer from the street cabinet to a subscriber's home is typically bridged using existing twisted pair copper cables or radio links. The bandwidth resources of the fibre to the street cabinet are typically shared amongst a group of subscribers using an Ethernet switch. For example the fibre may extend to a street cabinet, a kerb outside a subscribers home, or directly into the subscribers home itself. Due to the bulkiness, size and complexity of the ONT cabinets are all factors that increase design difficulty and accrue additional costs. Also, the ONT itself is valuable, and its mounting on a wall, especially outside, makes it susceptible to theft or to being accidentally knocked down. 
Therefore, it would be desirable to have a compact optical network terminal to make passive optical networks seamlessly connected to regular computers and any other systems to overcome the above restrictions.\"],\n", " 'summary': [' SUMMARY OF THE INVENTION An aspect of the present invention is to address at least the above-mentioned problems and/or disadvantages and to provide at least the advantages described below. Accordingly, an aspect of the present invention is to provide a compact optical network terminal, comprising a first interface coupled to a communications network, a second interface coupled to a network client and a processor including a circuitry and a memory coupled to the first interface and to the second interface, wherein the processor is capable of converting optical signals to electric signals, such that the network client can access the communications network. Other aspects, advantages, and salient features of the invention will become apparent to those skilled in the art from the following detailed description, which, taken in conjunction with the annexed drawings, discloses exemplary embodiments of the invention.'],\n", " 'description': [\"FIELD OF THE INVENTION The present invention relates to the field of passive optical network (PON), and in particular, to an optical network terminal (ONT) in the PON system. BACKGROUND OF THE INVENTION A network interface device permits a subscriber to access a network. A passive optical network (PON) is an example of a network capable of delivering voice, video and other data among multiple network subscribers, using a common optical fiber link. Passive optical splitters and combiners enable multiple optical network terminals (ONTs) to share the optical fiber link. In a PON, each ONT terminates the optical fiber link for a residential or business subscriber, and is sometimes referred to as a subscriber premises node that delivers Fiber to the Premises (FTTP) services. 
An ONT is connected to one or more subscriber devices, such as televisions, set-top boxes, telephones, computers, or network appliances, which ultimately receive the voice, video and data delivered vii the PON. An ONT is an example of a network interface, device. Other examples of a network interface device, in different network types, include cable modems and digital subscriber line (DSL) boxes. Generally, a network also includes a network access interface. In a PON, the network access interface is sometimes referred to as an optical line terminator (OLT), having multiple, independent PON interface modules that serve multiple optical fiber links. A PON interface module provides an interface for transmission and reception of data packets over a particular optical fiber link that serves a group of ONTs. A PON is a downstream-multicast medium. Each packet transmitted on an optical fiber link can be received by every ONT served by that link. ONTs identify selected packets or frames on the fiber link based on addressing information included within the packets or frames. Network equipment, such as network interface devices, in a cable or hybrid network may be connected to power provided by a central office (CO), which commonly utilizes battery and generator back-up power to maintain a continuous power supply. In contrast, an ONT in an all-fiber optic network is ordinarily powered locally at the subscriber premises. For this reason, an ONT often includes a battery to provide backup power during a power outage to maintain critical services, such as voice service. Conventionally, the fibre of a PON typically terminates at a street cabinet to be shared by a number of subscriber equipment. The street cabinet houses an optical network terminal (ONT). The last few meters or kilometer from the street cabinet to a subscriber's home is typically bridged using existing twisted pair copper cables or radio links. 
The bandwidth resources of the fibre to the street cabinet are typically shared amongst a group of subscribers using an Ethernet switch. For example the fibre may extend to a street cabinet, a kerb outside a subscribers home, or directly into the subscribers home itself. Due to the bulkiness, size and complexity of the ONT cabinets are all factors that increase design difficulty and accrue additional costs. Also, the ONT itself is valuable, and its mounting on a wall, especially outside, makes it susceptible to theft or to being accidentally knocked down. Therefore, it would be desirable to have a compact optical network terminal to make passive optical networks seamlessly connected to regular computers and any other systems to overcome the above restrictions. SUMMARY OF THE INVENTION An aspect of the present invention is to address at least the above-mentioned problems and/or disadvantages and to provide at least the advantages described below. Accordingly, an aspect of the present invention is to provide a compact optical network terminal, comprising a first interface coupled to a communications network, a second interface coupled to a network client and a processor including a circuitry and a memory coupled to the first interface and to the second interface, wherein the processor is capable of converting optical signals to electric signals, such that the network client can access the communications network. Other aspects, advantages, and salient features of the invention will become apparent to those skilled in the art from the following detailed description, which, taken in conjunction with the annexed drawings, discloses exemplary embodiments of the invention. BRIEF DESCRIPTION OF THE DRAWINGS The above and other aspects, features, and advantages of certain exemplary embodiments of the present invention will be more apparent from the following description taken in conjunction with the accompanying drawings in which: FIG. 
1A is a mechanical diagram of an optical network terminal (ONT) typical of customer premises equipment (CPE). FIG. 1B is a mechanical diagram of the ONT of FIG. 1A attached to a mounting bracket. FIG. 2 shows a typical Passive Optical Network (PON) Architecture. FIG. 3 shows a compatible optical network terminal (ONT) according to one embodiment of the present invention. FIG. 4 is a diagrammatic system view of a data processing system in which any of the embodiments disclosed herein may be performed. Persons skilled in the art will appreciate that elements in the figures are illustrated for simplicity and clarity and may have not been drawn to scale. For example, the dimensions of some of the elements in the figure may be exaggerated relative to other elements to help to improve understanding of various exemplary embodiments of the present disclosure. Throughout the drawings, it should be noted that like reference numbers are used to depict the same or similar elements, features, and structures. DETAIL DESCRIPTION OF THE INVENTION The following description with reference to the accompanying drawings is provided to assist in a comprehensive understanding of exemplary embodiments of the invention as defined by the claims and their equivalents. It includes various specific details to assist in that understanding but′ these are to be regarded as merely exemplary. Accordingly, those of ordinary skill in the art will recognize that various changes and modifications of the embodiments described herein can be made without departing from the scope and spirit of the invention. In addition, descriptions of well-known functions and constructions are omitted for clarity and conciseness. The terms and words used in the following description and claims are not limited to the bibliographical meanings, but, are merely used by the inventor to enable a clear and consistent understanding of the invention. 
Accordingly, it should be apparent to those skilled in the art that the following description of exemplary embodiments of the present invention are provided for illustration purpose only and not for the purpose of limiting the invention as defined by the appended claims and their equivalents. It is to be understood that the singular forms “a,” “an,” and “the” include plural referents unless the context clearly dictates otherwise. Thus, for example, reference to “a component surface” includes reference to one or more of such surfaces. By the term “substantially” it is meant that the recited characteristic, parameter, or value need not be achieved exactly, but that deviations or variations, including for example, tolerances, measurement error, measurement accuracy limitations and other factors known to those of skill in the art, may occur in amounts that do not preclude the effect the characteristic was intended to provide. FIGS. 1 through 4, discussed below, and the various embodiments used to describe the principles of the present disclosure in this patent document are by way of illustration only and should not be construed in any way that would limit the scope of the disclosure. Those skilled in the art will understand that the principles of the present disclosure may be implemented in any suitably arranged communications system. The terms used to describe various embodiments are exemplary. It should be understood that these are provided to merely aid the understanding of the description, and that their use and definitions in no way limit the scope of the invention. Terms first, second, and the like are used to differentiate between objects having the same terminology and are in no way intended to represent a chronological order, unless where explicitly stated otherwise. A set is defined as a non-empty set including at least one element. FIG. 
1A shows an optical network terminal (ONT) 100, which is an example of customer premises equipment (CPE), that connects a customer's communications equipment, e.g., computers, telephones, and televisions, to a telecommunications service provider. The ONT 100 includes an outer case 102 with an engagable cover 104 that covers a battery compartment (not shown) or another cavity of the ONT 100. A face 106 of the ONT 100 carries various connectors, including a power connector 108, coaxial cable connector 110, fiber optic cable connector 112, Ethernet (CAT-5) connector 114, and two telephone connectors 116. The ONT 100 transmits data to and receives data from a telecommunications network (not shown) via a fiber optic cable (not shown) connected to a fiber optic cable connector 112. Televisions, computers, and telephones on the customer's premises may be connected to the coaxial cable connector 110, Ethernet connector 114, and telephone connectors 116, respectively, on the ONT 100. FIG. 1B shows the ONT 100 of FIG. 1A with connector details with a bracket 120 attached to the outer case 102. The bracket 120 may be mounted to a wall (not shown), and the ONT 100 may be hung on the bracket. In many applications, the bracket 120 is installed on an exterior wall of a building or inside a garage, locations at which the ONT may be exposed to large temperature variations and different weather conditions. FIG. 2 shows a general Passive Optical Network (PON) Architecture. The elements of a PON are (i) Optical Line Terminal (OLT) 210 (ii) Passive Optical Splitter 220 and (iii) Optical Network Unit (ONU) 230. The Optical Line Terminal 210 is the main element of the network and is usually placed in the Local Exchange. It is a network element with PON line card, basically a aggregation switch. It works as an interface between core network and PON network. Optical Splitter 220 is a passive device with single input and multiple outputs. 
Optical power at input is split evenly between outputs. Not only signal travels from input to the outputs, signal can also travel from the output to the input. Splitters can be placed anywhere in between Central Office (CO) and Subscriber premises. It is used to connect an optical port of OLT with multiple subscribers. Optical Network units (ONUs) 230 serve as an interface to the network and are deployed at customer premises 240. It provides several interfaces for accessing triple play services and in the upper side it connects with the OLT via optical splitter. Although PONs can exist in three basic configuration (tree, bus and ring), the tree topology is favored due to smaller variation in the signal power from different end station. PON uses 1490 nm for the downstream wavelength and 1310 nm for the upstream wavelength. Signals are inserted or extracted from the fibre using a coarse wavelength division multiplexer (CWDM) filter at the CO and subscriber premises. FIG. 3 shows a compatible optical network terminal (ONT) according to one embodiment of the present invention. The optical network terminal (ONT) 300 includes a first interface 310, a second interface 320 and a middle region 330 sandwiched between the first and second interface. The first interface 310 coupled to a communications network 340, a second interface 320 coupled to a network client 350. The first interface is connected through a dedicated optical fiber link 360 (bi-directional) to receive optical signals from one or more communication network 340. The communication network may be or may include one or more but not limited to any of the xPON network 340 (e.g. of a broadband passive optical network (BPON), a gigabit-capable passive optical network (GPON), an Ethernet passive optical network (EPON), a gigabit-capable Ethernet passive optical network (GEPON), an active Ethernet optical network and any other future passive optical networks etc). 
The second interface 320 is coupled to the network client 350 though a USB port. In an operation, the middle region which may be a processor 330 including a memory (not shown in figure) coupled to the first interface 310 and to the second interface 320, wherein the processor 330 includes a circuitry which is configured for converting optical signals to electric signals, such that the network client can access the communications network. The first interface 310 may include an optical module (not shown in figure) which receives optical signals via the optical fiber link 360 and capable of converting the optical signals to electrical signals. The second interface 320 may include a control circuit (not shown in figure) which is capable of receiving the power from the network client 350 for processing the received electrical signals thereby reducing the required protocol processing time from the network client. Due to this behavior of the second interface 320 results in simplifying the ONT design by offloading the “non-volatile” part of the software to the network client 350 and downloading it on power to turn it. Most of the backend work can also be done by a software driver residing in the network client. Further, the second interface 320 acts as a network connectivity dongle with an optical transceiver at one end. Furthermore, the second interface may include a Universal Serial Bus (USB) jack which is couplable to Universal Serial Bus (USB) plug or connector of the network client 350. The second interface 320 capable of power up the “dongle” to connect it to the central office or Optical Line Terminal (OLT) by excluding external power source as required in the conventional design of ONT. In an example operation the Optical Network Terminal. (ONT) is connected to the network client through a USB port. Once the USB port of the network client 360 is coupled to the USB interface i.e. 
second interface 320, one or more driver needs to be installed at the network client 360 which then onwards controls the USB dongle (ONT) with the configured parameters at the installation time. The software boots up the USB dongle and communicates to network client 360 as a memory device with a built-in driver. The xPON protocol selected at the network client 360 will run and then converts the data coming from the WAN/LAN side to network client 360 as a network device. Once the software starts running in the network client 360, it would get connected to the OLT using the required xPON protocol. Once the network client 360 and the xPON network are connected, each network client 360 will have a dedicated connection (e.g. speed, bandwidth etc) as requested or selected by the client side. By this kind of novel and compatible design i.e. having xPON interface on one side and USB protocol interface on the other side will eradicate the necessity of the external power for the ONT. Also, by this kind of compatible design reduce the unnecessary splitting of equal upstream wavelength to all the network clients in the network. The network client may be or may include a host computer, a optical network unit, a optical network terminal or any other unit or terminal or device which is capable of accessing the passive optical network (xPON). FIG. 4 is a diagrammatic system view 400 of a data processing system in which any of the embodiments disclosed herein may be performed, according to one embodiment. Particularly, the diagrammatic system view of FIG. 4 illustrates a processor 402, a main memory 404, a static memory 406, a bus 408, a video display 410, an alpha-numeric input device 412, a cursor control device 414, a drive unit 416, a signal generation device 418, a network interface device 420, a machine readable medium 422, instructions 424 and a network 426. 
The diagrammatic system view 400 may indicate a personal computer and/or a data processing system in which one or more operations disclosed herein are performed. The processor 402 may be a microprocessor, a state machine, an application specific integrated circuit, a field programmable gate array; etc. (e.g., Intel® Pentium® processor). The main memory 404 may be a dynamic random access memory and/or a primary memory of a computer system. The static memory 406 may be a hard drive, a flash drive, and/or other memory information associated with the data processing system. The bus 408 may be an interconnection between various circuits and/or structures of the data processing system. The video display 410 may provide graphical representation of information on the data processing system. The alpha-numeric input device 412 may be a keypad, keyboard and/or any other input device of text (e.g., a special device to aid the physically handicapped). The cursor control device 414 may be a pointing device such as a mouse. The drive unit 416 may be a hard drive, a storage system, and/or other longer term storage subsystem. The signal generation device 418 may be a bios and/or a functional operating system of the data processing system. The network interface device 420 may perform interface functions (e.g., code conversion, protocol conversion, and/or buffering) required for communications to and from the network 426 between a number of independent devices (e.g., of varying protocols). The machine readable medium 422 may provide instructions on which any of the methods disclosed herein may be performed. The instructions 424 may provide source code and/or data code to the processor 402 to enable any one/or more operations disclosed herein. FIGS. 1-4 are merely representational and are not drawn to scale. Certain portions thereof may be exaggerated, while others may be minimized. FIGS. 
1-4 illustrate various embodiments of the invention that can be understood and appropriately carried out by those of ordinary skill in the art. In the foregoing detailed description of embodiments of the invention, various features are grouped together in a single embodiment for the purpose of streamlining the disclosure. This method of disclosure is not to be interpreted as reflecting an intention that the claimed embodiments of the invention require more features than are expressly recited in each claim. Rather, as the following claims reflect, inventive subject matter lies in less than all features of a single disclosed embodiment. Thus, the following claims are hereby incorporated into the detailed description of embodiments of the invention, with each claim standing on its own as a separate embodiment. It is understood that the above description is intended to be illustrative, and not restrictive. It is intended to cover all alternatives, modifications and equivalents as may be included within the spirit and scope of the invention as defined in the appended claims. Many other embodiments will be apparent to those of skill in the art upon reviewing the above description. The scope of the invention should, therefore, be determined with reference to the appended claims, along with the full scope of equivalents to which such claims are entitled. 
In the appended claims, the terms “including” and “in which” are used as the plain-English equivalents of the respective terms “comprising” and “wherein,” respectively.\"],\n", " 'cpc_label': ['H04Q110071'],\n", " 'ipc_label': ['H04Q1100'],\n", " 'filing_date': ['20160120'],\n", " 'patent_issue_date': ['20170606'],\n", " 'date_published': ['20160526'],\n", " 'examiner_id': ['95191.0'],\n", " 'input_ids': [[101,\n", " 1996,\n", " 2556,\n", " 11028,\n", " 14623,\n", " 2000,\n", " 13135,\n", " 9380,\n", " 2897,\n", " 1006,\n", " 13433,\n", " 2078,\n", " 1007,\n", " 1010,\n", " 1998,\n", " 1999,\n", " 3327,\n", " 1010,\n", " 2000,\n", " 2019,\n", " 9380,\n", " 2897,\n", " 5536,\n", " 1006,\n", " 2006,\n", " 2102,\n", " 1007,\n", " 1999,\n", " 1996,\n", " 13433,\n", " 2078,\n", " 2291,\n", " 1012,\n", " 1999,\n", " 2028,\n", " 7861,\n", " 5092,\n", " 21341,\n", " 1010,\n", " 1996,\n", " 9380,\n", " 2897,\n", " 5536,\n", " 2950,\n", " 1037,\n", " 2034,\n", " 8278,\n", " 11211,\n", " 2000,\n", " 1037,\n", " 4806,\n", " 2897,\n", " 1010,\n", " 1037,\n", " 2117,\n", " 8278,\n", " 11211,\n", " 2000,\n", " 1037,\n", " 2897,\n", " 7396,\n", " 1998,\n", " 1037,\n", " 13151,\n", " 2164,\n", " 1037,\n", " 3638,\n", " 11211,\n", " 2000,\n", " 1996,\n", " 2034,\n", " 8278,\n", " 1998,\n", " 2000,\n", " 1996,\n", " 2117,\n", " 8278,\n", " 1010,\n", " 16726,\n", " 1996,\n", " 13151,\n", " 2003,\n", " 5214,\n", " 1997,\n", " 16401,\n", " 9380,\n", " 7755,\n", " 2000,\n", " 3751,\n", " 7755,\n", " 1010,\n", " 2107,\n", " 2008,\n", " 1996,\n", " 2897,\n", " 7396,\n", " 2064,\n", " 3229,\n", " 1996,\n", " 4806,\n", " 2897,\n", " 1012,\n", " 102,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 
0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 
0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0]],\n", " 'attention_mask': [[1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", 
" 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 
0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0]]}" ] }, "metadata": {}, 
"execution_count": 20 } ] }, { "cell_type": "markdown", "source": [ "the claims section of the patent applications" ], "metadata": { "id": "anpCrdUr9_0_" } }, { "cell_type": "code", "source": [ "# Focus on the abstract section and tokenize the text using the tokenizer.\n", "_SECTION1_ = 'claims'" ], "metadata": { "id": "vIN41V3X-Boh" }, "execution_count": 21, "outputs": [] }, { "cell_type": "code", "source": [ "# Training set\n", "train_set = train_set.map(\n", " lambda e: tokenizer((e[_SECTION1_]), truncation=True, padding='max_length'),\n", " batched=True)" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "JOvF2Egv-GAp", "outputId": "78121db0-4e1d-452a-9cac-56d4daa0058b" }, "execution_count": 22, "outputs": [ { "output_type": "stream", "name": "stderr", "text": [ "WARNING:datasets.arrow_dataset:Loading cached processed dataset at /root/.cache/huggingface/datasets/HUPD___hupd/sample-bf35d7d92b870122/0.0.0/6920d2def8fd7767046c0470603357f76866e5a09c97e19571896bfdca521142/cache-c6955ad5199fbd84.arrow\n" ] } ] }, { "cell_type": "code", "source": [ "# Validation set\n", "val_set = val_set.map(\n", " lambda e: tokenizer((e[_SECTION1_]), truncation=True, padding='max_length'),\n", " batched=True)" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 17, "referenced_widgets": [ "2979cc614ea7448b8575d09fab4959d0", "78d5deb4cbf74aabaae89a42ceee72eb", "da7f9d8912fd403e85379419cd518023", "1564a0d3efc0455bae2c3d90325a4571", "734777f838be43f0b3e9c954e393d691", "df64aa40c8e0419f87075288d9383483", "ca7be44dc07d41829a2d3525ad0cb63c", "003d9c73437542dd9c4c59a3730ef696", "bfb2829000de43028c4922ecf2344134", "ce74e7478bef4ca987232389d94a89ee", "1e8b918d21ea44268fb1112f8fd1007f" ] }, "id": "Rkke0ati-JJA", "outputId": "bbfc3967-239e-435d-c777-ebfbffe033a8" }, "execution_count": 23, "outputs": [ { "output_type": "display_data", "data": { "text/plain": [ "Map: 0%| | 0/9094 [00:00 BACKGROUND OF THE INVENTION A network interface device 
permits a subscriber to access a network. A passive optical network (PON) is an example of a network capable of delivering voice, video and other data among multiple network subscribers, using a common optical fiber link. Passive optical splitters and combiners enable multiple optical network terminals (ONTs) to share the optical fiber link. In a PON, each ONT terminates the optical fiber link for a residential or business subscriber, and is sometimes referred to as a subscriber premises node that delivers Fiber to the Premises (FTTP) services. An ONT is connected to one or more subscriber devices, such as televisions, set-top boxes, telephones, computers, or network appliances, which ultimately receive the voice, video and data delivered vii the PON. An ONT is an example of a network interface, device. Other examples of a network interface device, in different network types, include cable modems and digital subscriber line (DSL) boxes. Generally, a network also includes a network access interface. In a PON, the network access interface is sometimes referred to as an optical line terminator (OLT), having multiple, independent PON interface modules that serve multiple optical fiber links. A PON interface module provides an interface for transmission and reception of data packets over a particular optical fiber link that serves a group of ONTs. A PON is a downstream-multicast medium. Each packet transmitted on an optical fiber link can be received by every ONT served by that link. ONTs identify selected packets or frames on the fiber link based on addressing information included within the packets or frames. Network equipment, such as network interface devices, in a cable or hybrid network may be connected to power provided by a central office (CO), which commonly utilizes battery and generator back-up power to maintain a continuous power supply. In contrast, an ONT in an all-fiber optic network is ordinarily powered locally at the subscriber premises. 
For this reason, an ONT often includes a battery to provide backup power during a power outage to maintain critical services, such as voice service. Conventionally, the fibre of a PON typically terminates at a street cabinet to be shared by a number of subscriber equipment. The street cabinet houses an optical network terminal (ONT). The last few meters or kilometer from the street cabinet to a subscriber's home is typically bridged using existing twisted pair copper cables or radio links. The bandwidth resources of the fibre to the street cabinet are typically shared amongst a group of subscribers using an Ethernet switch. For example the fibre may extend to a street cabinet, a kerb outside a subscribers home, or directly into the subscribers home itself. Due to the bulkiness, size and complexity of the ONT cabinets are all factors that increase design difficulty and accrue additional costs. Also, the ONT itself is valuable, and its mounting on a wall, especially outside, makes it susceptible to theft or to being accidentally knocked down. Therefore, it would be desirable to have a compact optical network terminal to make passive optical networks seamlessly connected to regular computers and any other systems to overcome the above restrictions.\"],\n", " 'summary': [' SUMMARY OF THE INVENTION An aspect of the present invention is to address at least the above-mentioned problems and/or disadvantages and to provide at least the advantages described below. Accordingly, an aspect of the present invention is to provide a compact optical network terminal, comprising a first interface coupled to a communications network, a second interface coupled to a network client and a processor including a circuitry and a memory coupled to the first interface and to the second interface, wherein the processor is capable of converting optical signals to electric signals, such that the network client can access the communications network. 
Other aspects, advantages, and salient features of the invention will become apparent to those skilled in the art from the following detailed description, which, taken in conjunction with the annexed drawings, discloses exemplary embodiments of the invention.'],\n", " 'description': [\"FIELD OF THE INVENTION The present invention relates to the field of passive optical network (PON), and in particular, to an optical network terminal (ONT) in the PON system. BACKGROUND OF THE INVENTION A network interface device permits a subscriber to access a network. A passive optical network (PON) is an example of a network capable of delivering voice, video and other data among multiple network subscribers, using a common optical fiber link. Passive optical splitters and combiners enable multiple optical network terminals (ONTs) to share the optical fiber link. In a PON, each ONT terminates the optical fiber link for a residential or business subscriber, and is sometimes referred to as a subscriber premises node that delivers Fiber to the Premises (FTTP) services. An ONT is connected to one or more subscriber devices, such as televisions, set-top boxes, telephones, computers, or network appliances, which ultimately receive the voice, video and data delivered vii the PON. An ONT is an example of a network interface, device. Other examples of a network interface device, in different network types, include cable modems and digital subscriber line (DSL) boxes. Generally, a network also includes a network access interface. In a PON, the network access interface is sometimes referred to as an optical line terminator (OLT), having multiple, independent PON interface modules that serve multiple optical fiber links. A PON interface module provides an interface for transmission and reception of data packets over a particular optical fiber link that serves a group of ONTs. A PON is a downstream-multicast medium. 
Each packet transmitted on an optical fiber link can be received by every ONT served by that link. ONTs identify selected packets or frames on the fiber link based on addressing information included within the packets or frames. Network equipment, such as network interface devices, in a cable or hybrid network may be connected to power provided by a central office (CO), which commonly utilizes battery and generator back-up power to maintain a continuous power supply. In contrast, an ONT in an all-fiber optic network is ordinarily powered locally at the subscriber premises. For this reason, an ONT often includes a battery to provide backup power during a power outage to maintain critical services, such as voice service. Conventionally, the fibre of a PON typically terminates at a street cabinet to be shared by a number of subscriber equipment. The street cabinet houses an optical network terminal (ONT). The last few meters or kilometer from the street cabinet to a subscriber's home is typically bridged using existing twisted pair copper cables or radio links. The bandwidth resources of the fibre to the street cabinet are typically shared amongst a group of subscribers using an Ethernet switch. For example the fibre may extend to a street cabinet, a kerb outside a subscribers home, or directly into the subscribers home itself. Due to the bulkiness, size and complexity of the ONT cabinets are all factors that increase design difficulty and accrue additional costs. Also, the ONT itself is valuable, and its mounting on a wall, especially outside, makes it susceptible to theft or to being accidentally knocked down. Therefore, it would be desirable to have a compact optical network terminal to make passive optical networks seamlessly connected to regular computers and any other systems to overcome the above restrictions. 
SUMMARY OF THE INVENTION An aspect of the present invention is to address at least the above-mentioned problems and/or disadvantages and to provide at least the advantages described below. Accordingly, an aspect of the present invention is to provide a compact optical network terminal, comprising a first interface coupled to a communications network, a second interface coupled to a network client and a processor including a circuitry and a memory coupled to the first interface and to the second interface, wherein the processor is capable of converting optical signals to electric signals, such that the network client can access the communications network. Other aspects, advantages, and salient features of the invention will become apparent to those skilled in the art from the following detailed description, which, taken in conjunction with the annexed drawings, discloses exemplary embodiments of the invention. BRIEF DESCRIPTION OF THE DRAWINGS The above and other aspects, features, and advantages of certain exemplary embodiments of the present invention will be more apparent from the following description taken in conjunction with the accompanying drawings in which: FIG. 1A is a mechanical diagram of an optical network terminal (ONT) typical of customer premises equipment (CPE). FIG. 1B is a mechanical diagram of the ONT of FIG. 1A attached to a mounting bracket. FIG. 2 shows a typical Passive Optical Network (PON) Architecture. FIG. 3 shows a compatible optical network terminal (ONT) according to one embodiment of the present invention. FIG. 4 is a diagrammatic system view of a data processing system in which any of the embodiments disclosed herein may be performed. Persons skilled in the art will appreciate that elements in the figures are illustrated for simplicity and clarity and may have not been drawn to scale. 
For example, the dimensions of some of the elements in the figure may be exaggerated relative to other elements to help to improve understanding of various exemplary embodiments of the present disclosure. Throughout the drawings, it should be noted that like reference numbers are used to depict the same or similar elements, features, and structures. DETAIL DESCRIPTION OF THE INVENTION The following description with reference to the accompanying drawings is provided to assist in a comprehensive understanding of exemplary embodiments of the invention as defined by the claims and their equivalents. It includes various specific details to assist in that understanding but′ these are to be regarded as merely exemplary. Accordingly, those of ordinary skill in the art will recognize that various changes and modifications of the embodiments described herein can be made without departing from the scope and spirit of the invention. In addition, descriptions of well-known functions and constructions are omitted for clarity and conciseness. The terms and words used in the following description and claims are not limited to the bibliographical meanings, but, are merely used by the inventor to enable a clear and consistent understanding of the invention. Accordingly, it should be apparent to those skilled in the art that the following description of exemplary embodiments of the present invention are provided for illustration purpose only and not for the purpose of limiting the invention as defined by the appended claims and their equivalents. It is to be understood that the singular forms “a,” “an,” and “the” include plural referents unless the context clearly dictates otherwise. Thus, for example, reference to “a component surface” includes reference to one or more of such surfaces. 
By the term “substantially” it is meant that the recited characteristic, parameter, or value need not be achieved exactly, but that deviations or variations, including for example, tolerances, measurement error, measurement accuracy limitations and other factors known to those of skill in the art, may occur in amounts that do not preclude the effect the characteristic was intended to provide. FIGS. 1 through 4, discussed below, and the various embodiments used to describe the principles of the present disclosure in this patent document are by way of illustration only and should not be construed in any way that would limit the scope of the disclosure. Those skilled in the art will understand that the principles of the present disclosure may be implemented in any suitably arranged communications system. The terms used to describe various embodiments are exemplary. It should be understood that these are provided to merely aid the understanding of the description, and that their use and definitions in no way limit the scope of the invention. Terms first, second, and the like are used to differentiate between objects having the same terminology and are in no way intended to represent a chronological order, unless where explicitly stated otherwise. A set is defined as a non-empty set including at least one element. FIG. 1A shows an optical network terminal (ONT) 100, which is an example of customer premises equipment (CPE), that connects a customer's communications equipment, e.g., computers, telephones, and televisions, to a telecommunications service provider. The ONT 100 includes an outer case 102 with an engagable cover 104 that covers a battery compartment (not shown) or another cavity of the ONT 100. A face 106 of the ONT 100 carries various connectors, including a power connector 108, coaxial cable connector 110, fiber optic cable connector 112, Ethernet (CAT-5) connector 114, and two telephone connectors 116. 
The ONT 100 transmits data to and receives data from a telecommunications network (not shown) via a fiber optic cable (not shown) connected to a fiber optic cable connector 112. Televisions, computers, and telephones on the customer's premises may be connected to the coaxial cable connector 110, Ethernet connector 114, and telephone connectors 116, respectively, on the ONT 100. FIG. 1B shows the ONT 100 of FIG. 1A with connector details with a bracket 120 attached to the outer case 102. The bracket 120 may be mounted to a wall (not shown), and the ONT 100 may be hung on the bracket. In many applications, the bracket 120 is installed on an exterior wall of a building or inside a garage, locations at which the ONT may be exposed to large temperature variations and different weather conditions. FIG. 2 shows a general Passive Optical Network (PON) Architecture. The elements of a PON are (i) Optical Line Terminal (OLT) 210 (ii) Passive Optical Splitter 220 and (iii) Optical Network Unit (ONU) 230. The Optical Line Terminal 210 is the main element of the network and is usually placed in the Local Exchange. It is a network element with PON line card, basically a aggregation switch. It works as an interface between core network and PON network. Optical Splitter 220 is a passive device with single input and multiple outputs. Optical power at input is split evenly between outputs. Not only signal travels from input to the outputs, signal can also travel from the output to the input. Splitters can be placed anywhere in between Central Office (CO) and Subscriber premises. It is used to connect an optical port of OLT with multiple subscribers. Optical Network units (ONUs) 230 serve as an interface to the network and are deployed at customer premises 240. It provides several interfaces for accessing triple play services and in the upper side it connects with the OLT via optical splitter. 
Although PONs can exist in three basic configuration (tree, bus and ring), the tree topology is favored due to smaller variation in the signal power from different end station. PON uses 1490 nm for the downstream wavelength and 1310 nm for the upstream wavelength. Signals are inserted or extracted from the fibre using a coarse wavelength division multiplexer (CWDM) filter at the CO and subscriber premises. FIG. 3 shows a compatible optical network terminal (ONT) according to one embodiment of the present invention. The optical network terminal (ONT) 300 includes a first interface 310, a second interface 320 and a middle region 330 sandwiched between the first and second interface. The first interface 310 coupled to a communications network 340, a second interface 320 coupled to a network client 350. The first interface is connected through a dedicated optical fiber link 360 (bi-directional) to receive optical signals from one or more communication network 340. The communication network may be or may include one or more but not limited to any of the xPON network 340 (e.g. of a broadband passive optical network (BPON), a gigabit-capable passive optical network (GPON), an Ethernet passive optical network (EPON), a gigabit-capable Ethernet passive optical network (GEPON), an active Ethernet optical network and any other future passive optical networks etc). The second interface 320 is coupled to the network client 350 though a USB port. In an operation, the middle region which may be a processor 330 including a memory (not shown in figure) coupled to the first interface 310 and to the second interface 320, wherein the processor 330 includes a circuitry which is configured for converting optical signals to electric signals, such that the network client can access the communications network. 
The first interface 310 may include an optical module (not shown in figure) which receives optical signals via the optical fiber link 360 and capable of converting the optical signals to electrical signals. The second interface 320 may include a control circuit (not shown in figure) which is capable of receiving the power from the network client 350 for processing the received electrical signals thereby reducing the required protocol processing time from the network client. Due to this behavior of the second interface 320 results in simplifying the ONT design by offloading the “non-volatile” part of the software to the network client 350 and downloading it on power to turn it. Most of the backend work can also be done by a software driver residing in the network client. Further, the second interface 320 acts as a network connectivity dongle with an optical transceiver at one end. Furthermore, the second interface may include a Universal Serial Bus (USB) jack which is couplable to Universal Serial Bus (USB) plug or connector of the network client 350. The second interface 320 capable of power up the “dongle” to connect it to the central office or Optical Line Terminal (OLT) by excluding external power source as required in the conventional design of ONT. In an example operation the Optical Network Terminal. (ONT) is connected to the network client through a USB port. Once the USB port of the network client 360 is coupled to the USB interface i.e. second interface 320, one or more driver needs to be installed at the network client 360 which then onwards controls the USB dongle (ONT) with the configured parameters at the installation time. The software boots up the USB dongle and communicates to network client 360 as a memory device with a built-in driver. The xPON protocol selected at the network client 360 will run and then converts the data coming from the WAN/LAN side to network client 360 as a network device. 
Once the software starts running in the network client 360, it would get connected to the OLT using the required xPON protocol. Once the network client 360 and the xPON network are connected, each network client 360 will have a dedicated connection (e.g. speed, bandwidth etc) as requested or selected by the client side. By this kind of novel and compatible design i.e. having xPON interface on one side and USB protocol interface on the other side will eradicate the necessity of the external power for the ONT. Also, by this kind of compatible design reduce the unnecessary splitting of equal upstream wavelength to all the network clients in the network. The network client may be or may include a host computer, a optical network unit, a optical network terminal or any other unit or terminal or device which is capable of accessing the passive optical network (xPON). FIG. 4 is a diagrammatic system view 400 of a data processing system in which any of the embodiments disclosed herein may be performed, according to one embodiment. Particularly, the diagrammatic system view of FIG. 4 illustrates a processor 402, a main memory 404, a static memory 406, a bus 408, a video display 410, an alpha-numeric input device 412, a cursor control device 414, a drive unit 416, a signal generation device 418, a network interface device 420, a machine readable medium 422, instructions 424 and a network 426. The diagrammatic system view 400 may indicate a personal computer and/or a data processing system in which one or more operations disclosed herein are performed. The processor 402 may be a microprocessor, a state machine, an application specific integrated circuit, a field programmable gate array; etc. (e.g., Intel® Pentium® processor). The main memory 404 may be a dynamic random access memory and/or a primary memory of a computer system. The static memory 406 may be a hard drive, a flash drive, and/or other memory information associated with the data processing system. 
The bus 408 may be an interconnection between various circuits and/or structures of the data processing system. The video display 410 may provide graphical representation of information on the data processing system. The alpha-numeric input device 412 may be a keypad, keyboard and/or any other input device of text (e.g., a special device to aid the physically handicapped). The cursor control device 414 may be a pointing device such as a mouse. The drive unit 416 may be a hard drive, a storage system, and/or other longer term storage subsystem. The signal generation device 418 may be a bios and/or a functional operating system of the data processing system. The network interface device 420 may perform interface functions (e.g., code conversion, protocol conversion, and/or buffering) required for communications to and from the network 426 between a number of independent devices (e.g., of varying protocols). The machine readable medium 422 may provide instructions on which any of the methods disclosed herein may be performed. The instructions 424 may provide source code and/or data code to the processor 402 to enable any one/or more operations disclosed herein. FIGS. 1-4 are merely representational and are not drawn to scale. Certain portions thereof may be exaggerated, while others may be minimized. FIGS. 1-4 illustrate various embodiments of the invention that can be understood and appropriately carried out by those of ordinary skill in the art. In the foregoing detailed description of embodiments of the invention, various features are grouped together in a single embodiment for the purpose of streamlining the disclosure. This method of disclosure is not to be interpreted as reflecting an intention that the claimed embodiments of the invention require more features than are expressly recited in each claim. Rather, as the following claims reflect, inventive subject matter lies in less than all features of a single disclosed embodiment. 
Thus, the following claims are hereby incorporated into the detailed description of embodiments of the invention, with each claim standing on its own as a separate embodiment. It is understood that the above description is intended to be illustrative, and not restrictive. It is intended to cover all alternatives, modifications and equivalents as may be included within the spirit and scope of the invention as defined in the appended claims. Many other embodiments will be apparent to those of skill in the art upon reviewing the above description. The scope of the invention should, therefore, be determined with reference to the appended claims, along with the full scope of equivalents to which such claims are entitled. In the appended claims, the terms “including” and “in which” are used as the plain-English equivalents of the respective terms “comprising” and “wherein,” respectively.\"],\n", " 'cpc_label': ['H04Q110071'],\n", " 'ipc_label': ['H04Q1100'],\n", " 'filing_date': ['20160120'],\n", " 'patent_issue_date': ['20170606'],\n", " 'date_published': ['20160526'],\n", " 'examiner_id': ['95191.0'],\n", " 'input_ids': [[101,\n", " 1015,\n", " 1012,\n", " 1037,\n", " 9233,\n", " 9380,\n", " 2897,\n", " 5536,\n", " 1010,\n", " 9605,\n", " 1024,\n", " 1037,\n", " 2034,\n", " 8278,\n", " 11211,\n", " 2000,\n", " 1037,\n", " 4806,\n", " 2897,\n", " 1025,\n", " 1037,\n", " 2117,\n", " 8278,\n", " 11211,\n", " 2000,\n", " 1037,\n", " 2897,\n", " 7396,\n", " 1010,\n", " 16726,\n", " 1996,\n", " 2117,\n", " 8278,\n", " 2003,\n", " 1037,\n", " 2897,\n", " 20831,\n", " 11947,\n", " 2571,\n", " 2007,\n", " 2019,\n", " 9380,\n", " 9099,\n", " 3401,\n", " 16402,\n", " 2012,\n", " 2028,\n", " 2203,\n", " 1025,\n", " 1998,\n", " 1037,\n", " 13151,\n", " 2164,\n", " 1037,\n", " 4984,\n", " 2854,\n", " 1998,\n", " 1037,\n", " 3638,\n", " 11211,\n", " 2000,\n", " 1996,\n", " 2034,\n", " 8278,\n", " 1998,\n", " 2000,\n", " 1996,\n", " 2117,\n", " 8278,\n", " 1010,\n", " 16726,\n", " 
1996,\n", " 13151,\n", " 2003,\n", " 5214,\n", " 1997,\n", " 16401,\n", " 9380,\n", " 7755,\n", " 2000,\n", " 3751,\n", " 7755,\n", " 1010,\n", " 2107,\n", " 2008,\n", " 1996,\n", " 2897,\n", " 7396,\n", " 2064,\n", " 3229,\n", " 1996,\n", " 4806,\n", " 2897,\n", " 8558,\n", " 8161,\n", " 1996,\n", " 14203,\n", " 14541,\n", " 1997,\n", " 5020,\n", " 13909,\n", " 29263,\n", " 2000,\n", " 2035,\n", " 1996,\n", " 2897,\n", " 7846,\n", " 1999,\n", " 1996,\n", " 2897,\n", " 1012,\n", " 1016,\n", " 1012,\n", " 1996,\n", " 9380,\n", " 2897,\n", " 5536,\n", " 1997,\n", " 4366,\n", " 1015,\n", " 1010,\n", " 16726,\n", " 1996,\n", " 2034,\n", " 8278,\n", " 2950,\n", " 2019,\n", " 9380,\n", " 11336,\n", " 2008,\n", " 8267,\n", " 9380,\n", " 7755,\n", " 3081,\n", " 1996,\n", " 9380,\n", " 11917,\n", " 4957,\n", " 1998,\n", " 19884,\n", " 1996,\n", " 9380,\n", " 7755,\n", " 2000,\n", " 5992,\n", " 7755,\n", " 1012,\n", " 1017,\n", " 1012,\n", " 1996,\n", " 9380,\n", " 2897,\n", " 5536,\n", " 1997,\n", " 4366,\n", " 1016,\n", " 1010,\n", " 16726,\n", " 1996,\n", " 9380,\n", " 11336,\n", " 2003,\n", " 13228,\n", " 2135,\n", " 9530,\n", " 8873,\n", " 27390,\n", " 3085,\n", " 2000,\n", " 2490,\n", " 2048,\n", " 2030,\n", " 2062,\n", " 1997,\n", " 1037,\n", " 19595,\n", " 13135,\n", " 9380,\n", " 2897,\n", " 1006,\n", " 17531,\n", " 2239,\n", " 1007,\n", " 1010,\n", " 1037,\n", " 15453,\n", " 28518,\n", " 2102,\n", " 1011,\n", " 5214,\n", " 13135,\n", " 9380,\n", " 2897,\n", " 1006,\n", " 14246,\n", " 2239,\n", " 1007,\n", " 1010,\n", " 2019,\n", " 26110,\n", " 13135,\n", " 9380,\n", " 2897,\n", " 1006,\n", " 4958,\n", " 2239,\n", " 1007,\n", " 1010,\n", " 1037,\n", " 15453,\n", " 28518,\n", " 2102,\n", " 1011,\n", " 5214,\n", " 26110,\n", " 13135,\n", " 9380,\n", " 2897,\n", " 1006,\n", " 16216,\n", " 26029,\n", " 1007,\n", " 1998,\n", " 2019,\n", " 3161,\n", " 26110,\n", " 9380,\n", " 2897,\n", " 1012,\n", " 1018,\n", " 1012,\n", " 1996,\n", " 9380,\n", " 2897,\n", " 5536,\n", " 
1997,\n", " 4366,\n", " 1015,\n", " 1010,\n", " 16726,\n", " 1996,\n", " 2897,\n", " 7396,\n", " 2950,\n", " 1037,\n", " 10463,\n", " 2121,\n", " 3131,\n", " 2005,\n", " 16401,\n", " 2012,\n", " 2560,\n", " 2070,\n", " 1997,\n", " 1996,\n", " 5992,\n", " 7755,\n", " 2000,\n", " 2951,\n", " 3197,\n", " 2029,\n", " 2003,\n", " 13228,\n", " 2135,\n", " 9530,\n", " 8873,\n", " 27390,\n", " 3085,\n", " 2000,\n", " 2490,\n", " 1037,\n", " 29018,\n", " 1997,\n", " 9380,\n", " 2897,\n", " 16744,\n", " 1012,\n", " 1019,\n", " 1012,\n", " 1996,\n", " 9380,\n", " 1010,\n", " 2897,\n", " 5536,\n", " 1997,\n", " 4366,\n", " 1015,\n", " 1010,\n", " 16726,\n", " 1996,\n", " 2117,\n", " 8278,\n", " 2950,\n", " 1037,\n", " 2491,\n", " 4984,\n", " 2854,\n", " 2029,\n", " 2003,\n", " 5214,\n", " 1997,\n", " 4909,\n", " 1996,\n", " 2373,\n", " 2013,\n", " 1996,\n", " 2897,\n", " 7396,\n", " 2005,\n", " 6364,\n", " 1996,\n", " 2363,\n", " 5992,\n", " 7755,\n", " 8558,\n", " 8161,\n", " 1996,\n", " 3223,\n", " 8778,\n", " 6364,\n", " 2051,\n", " 2013,\n", " 1996,\n", " 2897,\n", " 7396,\n", " 1012,\n", " 1020,\n", " 1012,\n", " 1996,\n", " 9380,\n", " 2897,\n", " 5536,\n", " 1997,\n", " 4366,\n", " 1015,\n", " 1010,\n", " 16726,\n", " 1996,\n", " 2897,\n", " 7396,\n", " 2003,\n", " 5214,\n", " 1997,\n", " 6364,\n", " 1996,\n", " 26726,\n", " 2239,\n", " 16744,\n", " 2000,\n", " 10639,\n", " 2007,\n", " 2028,\n", " 2030,\n", " 2062,\n", " 9380,\n", " 2240,\n", " 5536,\n", " 1006,\n", " 19330,\n", " 2102,\n", " 1007,\n", " 1012,\n", " 1021,\n", " 1012,\n", " 1006,\n", " 13261,\n", " 1007,\n", " 1022,\n", " 1012,\n", " 1996,\n", " 9380,\n", " 2897,\n", " 5536,\n", " 1997,\n", " 4366,\n", " 1015,\n", " 1010,\n", " 16726,\n", " 1996,\n", " 2117,\n", " 8278,\n", " 2950,\n", " 1037,\n", " 5415,\n", " 7642,\n", " 3902,\n", " 1006,\n", " 18833,\n", " 1007,\n", " 2990,\n", " 2029,\n", " 2003,\n", " 8648,\n", " 20470,\n", " 2571,\n", " 2000,\n", " 5415,\n", " 7642,\n", " 3902,\n", " 1006,\n", " 
18833,\n", " 1007,\n", " 13354,\n", " 2030,\n", " 19400,\n", " 1997,\n", " 1996,\n", " 2897,\n", " 7396,\n", " 1012,\n", " 1023,\n", " 1012,\n", " 1996,\n", " 9380,\n", " 2897,\n", " 5536,\n", " 1997,\n", " 4366,\n", " 1015,\n", " 1010,\n", " 16726,\n", " 1996,\n", " 2012,\n", " 2560,\n", " 2028,\n", " 4807,\n", " 2326,\n", " 2007,\n", " 1996,\n", " 26726,\n", " 2239,\n", " 2897,\n", " 8681,\n", " 1037,\n", " 2034,\n", " 4807,\n", " 2326,\n", " 1998,\n", " 1037,\n", " 2117,\n", " 4807,\n", " 2326,\n", " 1010,\n", " 1998,\n", " 16726,\n", " 1996,\n", " 4807,\n", " 2326,\n", " 2950,\n", " 2012,\n", " 2560,\n", " 2028,\n", " 2376,\n", " 4807,\n", " 2326,\n", " 1010,\n", " 1037,\n", " 2951,\n", " 4807,\n", " 2326,\n", " 1010,\n", " 1998,\n", " 1037,\n", " 2678,\n", " 2326,\n", " 1012,\n", " 2184,\n", " 1012,\n", " 1006,\n", " 13261,\n", " 1007,\n", " 102,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0,\n", " 0]],\n", " 'attention_mask': [[1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 
1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 1,\n", " 
# %% Set the format
# Expose only the model inputs and the label column, as torch tensors, so the
# default DataLoader collation can stack them into batches.
MODEL_COLUMNS = ['input_ids', 'attention_mask', 'decision']
for split in (train_set, val_set):
    split.set_format(type='torch', columns=MODEL_COLUMNS)

# %% train_dataloader and val_dataloader
BATCH_SIZE = 16

# Shuffle the training split so each epoch visits the samples in a different
# order; the seeded generator keeps that order reproducible across
# Restart & Run All. (`torch` is assumed to be imported in an earlier cell, as
# the training cell below already relies on it.)
train_dataloader = DataLoader(
    train_set,
    batch_size=BATCH_SIZE,
    shuffle=True,
    generator=torch.Generator().manual_seed(0),
)
# Validation order does not affect metrics, so it stays deterministic.
val_dataloader = DataLoader(val_set, batch_size=BATCH_SIZE)

# %% Get the next batch
# Peek at a single training batch as a sanity check on ids and labels.
batch = next(iter(train_dataloader))
# Print the ids
pprint(batch['input_ids'])
# Print the labels
pprint(batch['decision'])

# %% Print the input and output shapes
# The saved output of this cell shows (16, 512) inputs and (16,) labels.
input_shape = batch['input_ids'].shape
output_shape = batch['decision'].shape
print(f'Input shape: {input_shape}')
print(f'Output shape: {output_shape}')
def convert_ids_to_string(tokenizer, input, skip_special_tokens=False):
    """Render token ids as a single space-separated string of tokens.

    Args:
        tokenizer: Object exposing ``convert_ids_to_tokens(ids)``. When
            ``skip_special_tokens`` is true it must also accept that keyword.
        input: Token ids as a list, tuple, or any object with ``.tolist()``
            (e.g. a 1-D tensor or array); a single scalar id is also accepted.
        skip_special_tokens: If true, ask the tokenizer to drop special tokens
            so padded rows stay readable. Defaults to False, which reproduces
            the original output.

    Returns:
        The tokens joined by single spaces, or the lone token itself when the
        tokenizer returns a plain string for a scalar id.
    """
    # Convert tensors / arrays to plain Python ints so the tokenizer never has
    # to deal with framework-specific scalar types.
    ids = input.tolist() if hasattr(input, 'tolist') else input

    # Only forward the keyword when requested, so the default call is exactly
    # the one the original helper made.
    extra = {'skip_special_tokens': True} if skip_special_tokens else {}
    tokens = tokenizer.convert_ids_to_tokens(ids, **extra)

    # A scalar id can come back as a bare string; joining it would insert a
    # space between every character.
    if isinstance(tokens, str):
        return tokens
    return ' '.join(tokens)
the method of claim 2 , '\n", " 'wherein determining an acceptance criterion based on an individual reading '\n", " 'comprises determining an acceptance criterion based on a strength of a '\n", " 'signal in at least one of the first reading and the second reading . 4 . the '\n", " 'method of claim 2 , wherein determining an acceptance criterion based on an '\n", " 'individual reading comprises determining an acceptance criterion based on a '\n", " 'complexity of a signal in at least one of the first reading and the second '\n", " 'reading . 5 . the method of claim 1 , further comprising : rejecting the tag '\n", " 'if it is not accepted . 6 . the method of claim 5 , wherein rejecting the '\n", " 'tag comprises removing the tag without stopping the flow of production . 7 . '\n", " 'the method of claim 6 , wherein removing the tag comprises one or more of '\n", " 'marking the tag as rejected , cutting out the tag , punching out the tag , '\n", " 'and removing a tag using a su ##ction method . 8 . the method of claim 5 , '\n", " 'wherein rejecting the tag further comprises noting the rejected tag in a '\n", " 'database . 9 . 
# %% Load the pretrained encoder with a fresh classification head
# NOTE(review): 6 is carried over from the original cell; it is presumably the
# number of distinct `decision` classes -- confirm against the dataset.
NUM_LABELS = 6
model = DistilBertForSequenceClassification.from_pretrained(model_name, num_labels=NUM_LABELS)

# %% Fine-tune
from torch.utils.data import DataLoader

NUM_EPOCHS = 3
LEARNING_RATE = 5e-5

device = torch.device('cuda') if torch.cuda.is_available() else torch.device('cpu')
model.to(device)

# `transformers.AdamW` is deprecated upstream in favor of the PyTorch
# optimizer. eps / weight_decay are set explicitly because torch's defaults
# differ; the values below are meant to match the old transformers defaults
# (TODO confirm) so the optimization behaves as before.
optim = torch.optim.AdamW(
    model.parameters(),
    lr=LEARNING_RATE,
    eps=1e-6,
    weight_decay=0.0,
)

for epoch in range(NUM_EPOCHS):
    # --- training pass ---
    model.train()
    running_loss = 0.0
    num_batches = 0
    for batch in train_dataloader:
        optim.zero_grad()
        input_ids = batch['input_ids'].to(device)
        attention_mask = batch['attention_mask'].to(device)
        labels = batch['decision'].to(device)
        outputs = model(input_ids, attention_mask=attention_mask, labels=labels)
        # With `labels` supplied, the first output element is the loss.
        loss = outputs[0]
        loss.backward()
        optim.step()
        running_loss += loss.item()
        num_batches += 1

    # --- validation pass: no gradients, dropout disabled ---
    model.eval()
    num_correct = 0
    num_seen = 0
    with torch.no_grad():
        for batch in val_dataloader:
            input_ids = batch['input_ids'].to(device)
            attention_mask = batch['attention_mask'].to(device)
            labels = batch['decision'].to(device)
            # Without `labels`, the first output element is the logits.
            logits = model(input_ids, attention_mask=attention_mask)[0]
            num_correct += (logits.argmax(dim=-1) == labels).sum().item()
            num_seen += labels.size(0)

    # max(..., 1) keeps the report well-defined for an empty loader.
    mean_loss = running_loss / max(num_batches, 1)
    val_accuracy = num_correct / max(num_seen, 1)
    print(f'epoch {epoch + 1}/{NUM_EPOCHS}: '
          f'train loss {mean_loss:.4f}, val accuracy {val_accuracy:.4f}')

# Leave the model in inference mode before it is saved / used for prediction.
model.eval()

# %% Save the tuned model in "saved" directory
# Tokenizer and weights go to the same directory so both can be reloaded with
# `from_pretrained(save_directory)`.
save_directory = "saved"
tokenizer.save_pretrained(save_directory)
model.save_pretrained(save_directory)