diff --git "a/xlm-roberta.ipynb" "b/xlm-roberta.ipynb" new file mode 100644--- /dev/null +++ "b/xlm-roberta.ipynb" @@ -0,0 +1 @@ +{"cells":[{"cell_type":"code","execution_count":1,"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"executionInfo":{"elapsed":20058,"status":"ok","timestamp":1696057052179,"user":{"displayName":"Михаил Дворецкий","userId":"05054516382534405435"},"user_tz":-180},"id":"YQE9iI7muSEE","outputId":"d0febd6e-5ef6-4ae0-bb15-c16f2e8ccedd"},"outputs":[{"output_type":"stream","name":"stdout","text":["Collecting transformers\n"," Downloading transformers-4.33.3-py3-none-any.whl (7.6 MB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m7.6/7.6 MB\u001b[0m \u001b[31m48.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hCollecting datasets\n"," Downloading datasets-2.14.5-py3-none-any.whl (519 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m519.6/519.6 kB\u001b[0m \u001b[31m38.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: filelock in /usr/local/lib/python3.10/dist-packages (from transformers) (3.12.2)\n","Collecting huggingface-hub<1.0,>=0.15.1 (from transformers)\n"," Downloading huggingface_hub-0.17.3-py3-none-any.whl (295 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m295.0/295.0 kB\u001b[0m \u001b[31m36.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: numpy>=1.17 in /usr/local/lib/python3.10/dist-packages (from transformers) (1.23.5)\n","Requirement already satisfied: packaging>=20.0 in /usr/local/lib/python3.10/dist-packages (from transformers) (23.1)\n","Requirement already satisfied: pyyaml>=5.1 in /usr/local/lib/python3.10/dist-packages (from transformers) (6.0.1)\n","Requirement already satisfied: regex!=2019.12.17 in /usr/local/lib/python3.10/dist-packages (from transformers) (2023.6.3)\n","Requirement already satisfied: requests in /usr/local/lib/python3.10/dist-packages (from transformers) (2.31.0)\n","Collecting tokenizers!=0.11.3,<0.14,>=0.11.1 (from transformers)\n"," Downloading tokenizers-0.13.3-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (7.8 MB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m7.8/7.8 MB\u001b[0m \u001b[31m99.9 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hCollecting safetensors>=0.3.1 (from transformers)\n"," Downloading safetensors-0.3.3-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (1.3 MB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m1.3/1.3 MB\u001b[0m \u001b[31m71.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: tqdm>=4.27 in /usr/local/lib/python3.10/dist-packages (from transformers) (4.66.1)\n","Requirement already satisfied: pyarrow>=8.0.0 in /usr/local/lib/python3.10/dist-packages (from datasets) (9.0.0)\n","Collecting dill<0.3.8,>=0.3.0 (from datasets)\n"," Downloading dill-0.3.7-py3-none-any.whl (115 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m115.3/115.3 kB\u001b[0m \u001b[31m14.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: pandas in /usr/local/lib/python3.10/dist-packages (from datasets) (1.5.3)\n","Collecting xxhash (from datasets)\n"," Downloading xxhash-3.3.0-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (194 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m194.1/194.1 kB\u001b[0m \u001b[31m25.3 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hCollecting multiprocess (from datasets)\n"," Downloading multiprocess-0.70.15-py310-none-any.whl (134 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m134.8/134.8 kB\u001b[0m \u001b[31m17.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: fsspec[http]<2023.9.0,>=2023.1.0 in /usr/local/lib/python3.10/dist-packages (from datasets) (2023.6.0)\n","Requirement already satisfied: aiohttp in /usr/local/lib/python3.10/dist-packages (from datasets) (3.8.5)\n","Requirement already satisfied: attrs>=17.3.0 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (23.1.0)\n","Requirement already satisfied: charset-normalizer<4.0,>=2.0 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (3.2.0)\n","Requirement already satisfied: multidict<7.0,>=4.5 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (6.0.4)\n","Requirement already satisfied: async-timeout<5.0,>=4.0.0a3 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (4.0.3)\n","Requirement already satisfied: yarl<2.0,>=1.0 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (1.9.2)\n","Requirement already satisfied: frozenlist>=1.1.1 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (1.4.0)\n","Requirement already satisfied: aiosignal>=1.1.2 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (1.3.1)\n","Requirement already satisfied: typing-extensions>=3.7.4.3 in /usr/local/lib/python3.10/dist-packages (from huggingface-hub<1.0,>=0.15.1->transformers) (4.5.0)\n","Requirement already satisfied: idna<4,>=2.5 in /usr/local/lib/python3.10/dist-packages (from requests->transformers) (3.4)\n","Requirement already satisfied: urllib3<3,>=1.21.1 in /usr/local/lib/python3.10/dist-packages (from requests->transformers) (2.0.4)\n","Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.10/dist-packages (from requests->transformers) (2023.7.22)\n","Requirement already satisfied: python-dateutil>=2.8.1 in /usr/local/lib/python3.10/dist-packages (from pandas->datasets) (2.8.2)\n","Requirement already satisfied: pytz>=2020.1 in /usr/local/lib/python3.10/dist-packages (from pandas->datasets) (2023.3.post1)\n","Requirement already satisfied: six>=1.5 in /usr/local/lib/python3.10/dist-packages (from python-dateutil>=2.8.1->pandas->datasets) (1.16.0)\n","Installing collected packages: tokenizers, safetensors, xxhash, dill, multiprocess, huggingface-hub, transformers, datasets\n","Successfully installed datasets-2.14.5 dill-0.3.7 huggingface-hub-0.17.3 multiprocess-0.70.15 safetensors-0.3.3 tokenizers-0.13.3 transformers-4.33.3 xxhash-3.3.0\n"]}],"source":["!pip install transformers datasets"]},{"cell_type":"code","execution_count":2,"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"executionInfo":{"elapsed":17,"status":"ok","timestamp":1696057052180,"user":{"displayName":"Михаил Дворецкий","userId":"05054516382534405435"},"user_tz":-180},"id":"xAhSzSv4tGKi","outputId":"d5cdc85b-6682-42c7-eae8-041507478bf9"},"outputs":[{"output_type":"stream","name":"stdout","text":["Token will not been saved to git credential helper. Pass `add_to_git_credential=True` if you want to set the git credential as well.\n","Token is valid (permission: write).\n","Your token has been saved to /root/.cache/huggingface/token\n","Login successful\n"]}],"source":["!huggingface-cli login --token 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"]},{"cell_type":"code","source":["!pip install transformers[torch]"],"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"3fuCLWFPxkFl","executionInfo":{"status":"ok","timestamp":1696057060107,"user_tz":-180,"elapsed":7937,"user":{"displayName":"Михаил Дворецкий","userId":"05054516382534405435"}},"outputId":"9a74689c-dad7-44f8-870b-66357d6afab0"},"execution_count":3,"outputs":[{"output_type":"stream","name":"stdout","text":["Requirement already satisfied: transformers[torch] in /usr/local/lib/python3.10/dist-packages (4.33.3)\n","Requirement already satisfied: filelock in /usr/local/lib/python3.10/dist-packages (from transformers[torch]) (3.12.2)\n","Requirement already satisfied: huggingface-hub<1.0,>=0.15.1 in /usr/local/lib/python3.10/dist-packages (from transformers[torch]) (0.17.3)\n","Requirement already satisfied: numpy>=1.17 in /usr/local/lib/python3.10/dist-packages (from transformers[torch]) (1.23.5)\n","Requirement already satisfied: packaging>=20.0 in /usr/local/lib/python3.10/dist-packages (from transformers[torch]) (23.1)\n","Requirement already satisfied: pyyaml>=5.1 in /usr/local/lib/python3.10/dist-packages (from transformers[torch]) (6.0.1)\n","Requirement already satisfied: regex!=2019.12.17 in /usr/local/lib/python3.10/dist-packages (from transformers[torch]) (2023.6.3)\n","Requirement already satisfied: requests in /usr/local/lib/python3.10/dist-packages (from transformers[torch]) (2.31.0)\n","Requirement already satisfied: tokenizers!=0.11.3,<0.14,>=0.11.1 in /usr/local/lib/python3.10/dist-packages (from transformers[torch]) (0.13.3)\n","Requirement already satisfied: safetensors>=0.3.1 in /usr/local/lib/python3.10/dist-packages (from transformers[torch]) (0.3.3)\n","Requirement already satisfied: tqdm>=4.27 in /usr/local/lib/python3.10/dist-packages (from transformers[torch]) (4.66.1)\n","Requirement already satisfied: torch!=1.12.0,>=1.10 in /usr/local/lib/python3.10/dist-packages (from transformers[torch]) (2.0.1+cu118)\n","Collecting accelerate>=0.20.3 (from transformers[torch])\n"," Downloading accelerate-0.23.0-py3-none-any.whl (258 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m258.1/258.1 kB\u001b[0m \u001b[31m3.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: psutil in /usr/local/lib/python3.10/dist-packages (from accelerate>=0.20.3->transformers[torch]) (5.9.5)\n","Requirement already satisfied: fsspec in /usr/local/lib/python3.10/dist-packages (from huggingface-hub<1.0,>=0.15.1->transformers[torch]) (2023.6.0)\n","Requirement already satisfied: typing-extensions>=3.7.4.3 in /usr/local/lib/python3.10/dist-packages (from huggingface-hub<1.0,>=0.15.1->transformers[torch]) (4.5.0)\n","Requirement already satisfied: sympy in /usr/local/lib/python3.10/dist-packages (from torch!=1.12.0,>=1.10->transformers[torch]) (1.12)\n","Requirement already satisfied: networkx in /usr/local/lib/python3.10/dist-packages (from torch!=1.12.0,>=1.10->transformers[torch]) (3.1)\n","Requirement already satisfied: jinja2 in /usr/local/lib/python3.10/dist-packages (from torch!=1.12.0,>=1.10->transformers[torch]) (3.1.2)\n","Requirement already satisfied: triton==2.0.0 in /usr/local/lib/python3.10/dist-packages (from torch!=1.12.0,>=1.10->transformers[torch]) (2.0.0)\n","Requirement already satisfied: cmake in /usr/local/lib/python3.10/dist-packages (from triton==2.0.0->torch!=1.12.0,>=1.10->transformers[torch]) (3.27.4.1)\n","Requirement already satisfied: lit in /usr/local/lib/python3.10/dist-packages (from triton==2.0.0->torch!=1.12.0,>=1.10->transformers[torch]) (16.0.6)\n","Requirement already satisfied: charset-normalizer<4,>=2 in /usr/local/lib/python3.10/dist-packages (from requests->transformers[torch]) (3.2.0)\n","Requirement already satisfied: idna<4,>=2.5 in /usr/local/lib/python3.10/dist-packages (from requests->transformers[torch]) (3.4)\n","Requirement already satisfied: urllib3<3,>=1.21.1 in /usr/local/lib/python3.10/dist-packages (from requests->transformers[torch]) (2.0.4)\n","Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.10/dist-packages (from requests->transformers[torch]) (2023.7.22)\n","Requirement already satisfied: MarkupSafe>=2.0 in /usr/local/lib/python3.10/dist-packages (from jinja2->torch!=1.12.0,>=1.10->transformers[torch]) (2.1.3)\n","Requirement already satisfied: mpmath>=0.19 in /usr/local/lib/python3.10/dist-packages (from sympy->torch!=1.12.0,>=1.10->transformers[torch]) (1.3.0)\n","Installing collected packages: accelerate\n","Successfully installed accelerate-0.23.0\n"]}]},{"cell_type":"code","execution_count":4,"metadata":{"executionInfo":{"elapsed":10255,"status":"ok","timestamp":1696057070335,"user":{"displayName":"Михаил Дворецкий","userId":"05054516382534405435"},"user_tz":-180},"id":"YoYMH8g6tl77"},"outputs":[],"source":["from transformers import AutoTokenizer, TrainingArguments, Trainer, AutoModelForQuestionAnswering\n","import pandas as pd\n","from transformers import DefaultDataCollator\n","from datasets import Dataset"]},{"cell_type":"code","execution_count":5,"metadata":{"colab":{"base_uri":"https://localhost:8080/","height":317,"referenced_widgets":["6a9405378a2c4b768198bec703b6c5ed","ff31f8dba656432c9eba301e4decd6fd","5009a50415b34664bbbdb97dd13f4a08","776a34370620464cac886019dd9b20b9","d3b72b3110484652938c1866a2425e66","ad634cd3a4e54436b2c9deb3e67c587e","639d04ab4a154aea9d89a2b82d594a75","9829e2d444664b24a123dd12fb60b45c","7e1fff101381474eaf784849b63a492a","e3f4c5837c2a40e4b1b69aae4551818b","ccc1ba717346441784201a8374b37eef","787e83175dc544259751c526731adfc3","f4d48177fd4b4ef8810b270b51f65058","d458f015e0264adab4a6a4143bf3b0fa","8277a542522c4c18b8b5287b0c7e4c50","ca708c4952154b789228f5e30ca8b6bc","a975eafbb45c4d898a121e4f7471c523","ba9f9de1cd73492482eb3eb51907f8cc","5a098c18bb72449d92367f7c2bf35f30","cd3ae104e9584b238881d2d8d125cf82","ff388bc683974a6e88bd5df073bd7773","6b7b3937368949599a572b9509cc4392","de5b1372628741eca6e49bf226b54fe7","06fa804ff03e4f77b96ba0669234f0e0","8358f38bb15149fc984cb2c70733997c","d44d054f85f14e7d947963543a7b9260","eba18c15d71b466c84c366c2efd0be1d","33257c3f1cf840c59660b2e3c80a0b3e","c7b581a0e0804a999eb807d4408128ff","40f5000ca9024076b950a7e26538ac05","d721928ea4b24cc28b250fd3eb80a6ee","8732ac9c9098488e9c6065162fb29991","f1b9aefa512d4763ab6e372eb4ce9a5d","783b1e764d994dcebd1cfaeabfdda844","1fb77166964443a6aed1863d36933c4b","e32a281517344ae09449be971eb67da7","c291262f0ad74a2f95d24ef00a5da470","e739dee905d845978505c7807d1c522a","7020eba8292e4e78a099185032d9c538","8b1b641792bc419e88d0db49ec4d4e90","1877325aa28b48ff8d9c97d672b52b2c","a22d7aadf5bb4f62b4b825827fd3f9a7","92f2f3c007fd4705b6945a6c4570db0e","c57cff14464c4f209fcc033194e7b1c3","55213581b1fd4339b78d5dc023d952c3","c1aa6eb05acc44a4a01ee9d0217d3b91","1c64e45f9ded444abab117e2d6e1fdc6","b5010912d9a6491498f1d7980fffe1ba","acd25676ea744dd49fbfabb4d8e793f9","e077ea61963f407fb13e2fe9cd542230","214dda72ea174daaa6bbdea2f3a22a95","a39d8a50eb6f479883add717bdceee94","e8ddabe424394525882925b9b912a0d4","60ac7cd117f2421d98af0874ccf90996","11e017ac2fee4fa2a291e8e71ba74894"]},"executionInfo":{"elapsed":5231,"status":"ok","timestamp":1696057075558,"user":{"displayName":"Михаил Дворецкий","userId":"05054516382534405435"},"user_tz":-180},"id":"RwEBZ6YGtrGP","outputId":"c980ce7e-c4ab-455f-824a-e23b667e6271"},"outputs":[{"output_type":"display_data","data":{"text/plain":["Downloading (…)okenizer_config.json: 0%| | 0.00/516 [00:00 end_char[i] or offset[context_end][1] < start_char[i]:\n"," start_positions.append(0)\n"," end_positions.append(0)\n"," else:\n"," # Otherwise it's the start and end token positions\n"," idx = context_start\n"," while idx <= context_end and offset[idx][0] <= start_char[i]:\n"," idx += 1\n"," start_positions.append(idx - 1)\n","\n"," idx = context_end\n"," while idx >= context_start and offset[idx][1] >= end_char[i]:\n"," idx -= 1\n"," end_positions.append(idx + 1)\n","\n"," inputs[\"start_positions\"] = start_positions\n"," inputs[\"end_positions\"] = end_positions\n"," return inputs"]},{"cell_type":"code","execution_count":10,"metadata":{"executionInfo":{"elapsed":1112,"status":"ok","timestamp":1696057101748,"user":{"displayName":"Михаил Дворецкий","userId":"05054516382534405435"},"user_tz":-180},"id":"lFLCNe6Vt0Yk"},"outputs":[],"source":["data = Dataset.from_dict(preprocessing(data))"]},{"cell_type":"code","execution_count":11,"metadata":{"colab":{"base_uri":"https://localhost:8080/","height":77,"referenced_widgets":["6c0f9224645f43c093c2d355fdee335d","cad7db9c8546411bbce1f3abf250058d","b30767e8371c45209ce78372425556f2","0e0d5cdcd8d14cd38edee1a9d7e259f4","334499cf1e29446b9d0241d6c59552bd","8a10971754004930836fe820e49b212d","ed43aadb6c5449d78d6a75deab809bf4","66dc2621a32c4364b9879a4f7e2457f0","ab1733d7a1fb4abca477eac077a51047","6dca6550bef84edb90542ded37fb0abf","40e0081f38ed4a93af5eeb8b6f728619"]},"id":"h8jfXolgt3XJ","executionInfo":{"status":"ok","timestamp":1696057127991,"user_tz":-180,"elapsed":25705,"user":{"displayName":"Михаил Дворецкий","userId":"05054516382534405435"}},"outputId":"eb584389-bef6-4007-ded2-bfa92f2bac4b"},"outputs":[{"output_type":"display_data","data":{"text/plain":["Downloading pytorch_model.bin: 0%| | 0.00/2.24G [00:00"],"text/html":["\n","
\n"," \n"," \n"," [477/477 05:30, Epoch 3/3]\n","
\n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n","
EpochTraining LossValidation Loss
1No log0.283688
2No log0.213056
3No log0.113657

"]},"metadata":{}},{"output_type":"execute_result","data":{"text/plain":["TrainOutput(global_step=477, training_loss=0.45255054018032626, metrics={'train_runtime': 332.0341, 'train_samples_per_second': 1.437, 'train_steps_per_second': 1.437, 'total_flos': 432610581294000.0, 'train_loss': 0.45255054018032626, 'epoch': 3.0})"]},"metadata":{},"execution_count":15}],"source":["trainer.train()"]},{"cell_type":"code","execution_count":null,"metadata":{"id":"01g-y3FmuFf2","colab":{"base_uri":"https://localhost:8080/","height":145,"referenced_widgets":["5ed29e3898214fe9a47f10158770a1ff","3a55e0ee4add4ccb917583769fea3946","5cd3839534fa4f0fbdcd8c7498c32e4f","f334d78dbf514ea5a8c877a1e8c7b1f7","597b5cbeb3ed4cf7a7adafd57a35b263","447139dec0dd4bf8abed222c589d276a","5f6d4b2a25404a598782227ff437fd0e","99ad4594d89144e4a3b8265446f1d203","1faac4932d1c451a8326e6c34ed5164a","772b3346877c4672b4d9310a28c4a6dc","10c35b59fd5e44d39871900c39d82648","fb2ddc1c6061401481385932104f27dc","08e1ee4d0cc049a581e22198dc6eca05","7e8ac63132984d248c1dde5ce566068a","3a287a61bee045868dadd9b57fd8e704","409ffb0c00c94678921e97196599f8d6","79a9425638fe42c2894f62ff8ee33859","d7c52c3c1f34474ea8377aab6ea915ad","81a48f18324042978e0950debc5a2af6","b2259b66f2a940689f2c21da2c52adfa","b8d9d855fc50423f8cc2935c429700c6","6b495106914247458e8c37618770e8e5","6fffd7d043a44a92b0fc2869b519e4da","6777c6ca16ce443f85967044d7970e9a","b97096dc88194654a7eb94283552d055","99557ce0e6914c37b0010f0a00ec78f4","a7cd4a1aeb52490dadcf2f077642950d","38bf8039d3514f6792b131a10b19f194","37f2287e955849589d2aa06af7e30257","f1c5e8ee4f894f2dbd8e5457d4ecea5c","e39c17d7322d45c98fab1dd818d90f21","ba5de6b05bfa4a958652a52129d3881e","df5d7dbf65cf4dcf89e95084ed656035","a42d99a9dcaa4788803466667ffe305d","51ded9df191548b7960c13ddcda71913","da3815597dbe40c593bda465ff73a33d","0a6e0733422543a8a8f777f3e73743e2","7775a5b43c1d463ca81a3994f6b530e8","10d4dd9e4f964a82ac49f199045071d7","dc1be0ad2dfd46729e8ae0ea5a7c1c94","966840088dd142e88aa0edf642eb1747","702186d341bc40b28e4abadd5abda574","9cb96e764d2b4a3b84afb54957dba92f","7461173a529a4470b98e2335720e86b9"]},"outputId":"c870ba77-425e-4f26-c7ce-af4d5ec42bba"},"outputs":[{"output_type":"display_data","data":{"text/plain":["training_args.bin: 0%| | 0.00/4.09k [00:00