diff --git "a/notebooks/qwen-3-0-6b-reasoning-vi-medical-lora.ipynb" "b/notebooks/qwen-3-0-6b-reasoning-vi-medical-lora.ipynb"
new file mode 100644--- /dev/null
+++ "b/notebooks/qwen-3-0-6b-reasoning-vi-medical-lora.ipynb"
@@ -0,0 +1,3513 @@
+{
+ "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "metadata": {
+    "_cell_guid": "b1076dfc-b9ad-4769-8c92-a6c4dae69d19",
+    "_uuid": "8f2839f25d086af736a60e9eeb907d3b93b6e0e5",
+    "execution": {
+     "iopub.execute_input": "2025-07-06T11:09:36.629664Z",
+     "iopub.status.busy": "2025-07-06T11:09:36.629419Z",
+     "iopub.status.idle": "2025-07-06T11:12:42.232385Z",
+     "shell.execute_reply": "2025-07-06T11:12:42.231459Z",
+     "shell.execute_reply.started": "2025-07-06T11:09:36.629644Z"
+    },
+    "trusted": true
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m46.9/46.9 kB\u001b[0m \u001b[31m1.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+      "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m294.5/294.5 kB\u001b[0m \u001b[31m7.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0mta \u001b[36m0:00:01\u001b[0m\n",
+      "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m375.8/375.8 kB\u001b[0m \u001b[31m19.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+      "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m154.2/154.2 kB\u001b[0m \u001b[31m10.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+      "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m31.5/31.5 MB\u001b[0m \u001b[31m60.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m:00:01\u001b[0m00:01\u001b[0m\n",
+      "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m865.2/865.2 MB\u001b[0m \u001b[31m2.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m0:00:01\u001b[0m00:01\u001b[0m\n",
+      "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m156.5/156.5 MB\u001b[0m \u001b[31m7.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m0:00:01\u001b[0m00:01\u001b[0m\n",
+      "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m393.1/393.1 MB\u001b[0m \u001b[31m4.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m0:00:01\u001b[0m00:01\u001b[0m\n",
+      "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m8.9/8.9 MB\u001b[0m \u001b[31m5.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m0:00:01\u001b[0m00:01\u001b[0m\n",
+      "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m23.7/23.7 MB\u001b[0m \u001b[31m6.4 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m0:00:01\u001b[0m00:01\u001b[0m\n",
+      "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m897.7/897.7 kB\u001b[0m \u001b[31m43.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+      "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m571.0/571.0 MB\u001b[0m \u001b[31m3.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m0:00:01\u001b[0m00:01\u001b[0m\n",
+      "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m200.2/200.2 MB\u001b[0m \u001b[31m8.6 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m0:00:01\u001b[0m00:01\u001b[0m\n",
+      "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m1.1/1.1 MB\u001b[0m \u001b[31m45.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+      "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m56.3/56.3 MB\u001b[0m \u001b[31m31.3 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m:00:01\u001b[0m00:01\u001b[0m\n",
+      "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m158.2/158.2 MB\u001b[0m \u001b[31m7.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m0:00:01\u001b[0m00:01\u001b[0m\n",
+      "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m216.6/216.6 MB\u001b[0m \u001b[31m7.9 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m0:00:01\u001b[0m00:01\u001b[0m\n",
+      "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m156.8/156.8 MB\u001b[0m \u001b[31m10.9 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m:00:01\u001b[0m00:01\u001b[0m\n",
+      "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m201.3/201.3 MB\u001b[0m \u001b[31m1.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m0:00:01\u001b[0m00:01\u001b[0m\n",
+      "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m19.7/19.7 MB\u001b[0m \u001b[31m12.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m:00:01\u001b[0m00:01\u001b[0m\n",
+      "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m89.3/89.3 kB\u001b[0m \u001b[31m6.9 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+      "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m72.9/72.9 MB\u001b[0m \u001b[31m24.4 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m:00:01\u001b[0m00:01\u001b[0m\n",
+      "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m7.4/7.4 MB\u001b[0m \u001b[31m100.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m00:01\u001b[0m00:01\u001b[0m\n",
+      "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m129.0/129.0 kB\u001b[0m \u001b[31m9.6 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+      "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m193.6/193.6 kB\u001b[0m \u001b[31m13.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+      "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m6.3/6.3 MB\u001b[0m \u001b[31m101.6 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m00:01\u001b[0m\n",
+      "\u001b[2K   \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m210.7/210.7 kB\u001b[0m \u001b[31m15.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+      "\u001b[?25h\u001b[31mERROR: pip's dependency resolver does not currently take into account all the packages that are installed. This behaviour is the source of the following dependency conflicts.\n",
+      "cesium 0.12.4 requires numpy<3.0,>=2.0, but you have numpy 1.26.4 which is incompatible.\n",
+      "torchaudio 2.6.0+cu124 requires torch==2.6.0, but you have torch 2.7.0 which is incompatible.\n",
+      "bigframes 1.42.0 requires rich<14,>=12.4.4, but you have rich 14.0.0 which is incompatible.\n",
+      "gcsfs 2025.3.2 requires fsspec==2025.3.2, but you have fsspec 2025.3.0 which is incompatible.\n",
+      "fastai 2.7.19 requires torch<2.7,>=1.10, but you have torch 2.7.0 which is incompatible.\u001b[0m\u001b[31m\n",
+      "\u001b[0m"
+     ]
+    }
+   ],
+   "source": [
+    "# Pin unsloth so a rerun installs the same release; 2025.6.12 is the version\n",
+    "# reported in the saved output of the version-check cell of this notebook.\n",
+    "# %pip (rather than !pip) installs into the environment of the running kernel.\n",
+    "%pip install -q unsloth==2025.6.12"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "metadata": {
+    "execution": {
+     "iopub.execute_input": "2025-07-05T08:11:04.100619Z",
+     "iopub.status.busy": "2025-07-05T08:11:04.100237Z",
+     "iopub.status.idle": "2025-07-05T08:11:34.999544Z",
+     "shell.execute_reply": "2025-07-05T08:11:34.998784Z",
+     "shell.execute_reply.started": "2025-07-05T08:11:04.100592Z"
+    },
+    "trusted": true
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "🦥 Unsloth: Will patch your computer to enable 2x faster free finetuning.\n"
+     ]
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "2025-07-05 08:11:15.174279: E external/local_xla/xla/stream_executor/cuda/cuda_fft.cc:477] Unable to register cuFFT factory: Attempting to register factory for plugin cuFFT when one has already been registered\n",
+      "WARNING: All log messages before absl::InitializeLog() is called are written to STDERR\n",
+      "E0000 00:00:1751703075.342853      35 cuda_dnn.cc:8310] Unable to register cuDNN factory: Attempting to register factory for plugin cuDNN when one has already been registered\n",
+      "E0000 00:00:1751703075.461285      35 cuda_blas.cc:1418] Unable to register cuBLAS factory: Attempting to register factory for plugin cuBLAS when one has already been registered\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "🦥 Unsloth Zoo will now patch everything to make training faster!\n",
+      "datasets.__version__ 3.6.0\n",
+      "numpy.__version__ 1.26.4\n",
+      "unsloth.__version__ 2025.6.12\n",
+      "torch.__version__ 2.7.0+cu126\n",
+      "transformers.__version__ 4.51.3\n",
+      "trl.__version__ 0.19.0\n"
+     ]
+    }
+   ],
+   "source": [
+    "import datasets\n",
+    "import numpy as np\n",
+    "\n",
+    "# Keep unsloth ahead of trl/transformers: it reports patching libraries when imported.\n",
+    "import unsloth\n",
+    "import torch\n",
+    "import trl\n",
+    "import transformers\n",
+    "\n",
+    "# Print the version of every key dependency so a run can be reproduced.\n",
+    "# module.__name__ yields the same label the hand-written prints used (np -> numpy).\n",
+    "for module in (datasets, np, unsloth, torch, transformers, trl):\n",
+    "    print(f\"{module.__name__}.__version__\", module.__version__)\n",
+    "\n",
+    "# Versions recorded from an earlier run, kept for reference only\n",
+    "# (a newer install may report a different unsloth version):\n",
+    "# datasets.__version__ 3.6.0\n",
+    "# numpy.__version__ 1.26.4\n",
+    "# unsloth.__version__ 2025.6.3\n",
+    "# torch.__version__ 2.7.0+cu126\n",
+    "# transformers.__version__ 4.51.3\n",
+    "# trl.__version__ 0.19.0"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {
+    "execution": {
+     "iopub.execute_input": "2025-07-06T11:12:42.234163Z",
+     "iopub.status.busy": "2025-07-06T11:12:42.233893Z",
+     "iopub.status.idle": "2025-07-06T11:12:58.668872Z",
+     "shell.execute_reply": "2025-07-06T11:12:58.668079Z",
+     "shell.execute_reply.started": "2025-07-06T11:12:42.234140Z"
+    },
+    "trusted": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "b3b5ba312a6b4a3d81250785bf465432",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "Fetching 182 files:   0%|          | 0/182 [00:00<?, ?it/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "283e0d3f9ef944f9a3decb3d4cfa417d",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "adapter_model.safetensors:   0%|          | 0.00/40.4M [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "1d7c5669da574e63a6392ebf49271ebc",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "added_tokens.json:   0%|          | 0.00/707 [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "880b720a876d4369bfbfe4801b7fa974",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "adapter_config.json:   0%|          | 0.00/806 [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "3dfe1bf4f98d443fbf419428c793b34c",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "optimizer.pt:   0%|          | 0.00/21.0M [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "a1f3332a5878466b97a9d4719594852c",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "merges.txt: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "8a37b523008145eb98d9236cedfbe724",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       ".gitattributes: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "40c873ce24d84b539ff1ab29dd09ae6f",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "README.md: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "74d929c26e29442bbd03b194f17d756a",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "README.md: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "7d5713994f244b6bb3d09b0c2732a1fc",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "scaler.pt:   0%|          | 0.00/1.38k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "3dd307a455934b9e9e1f2f2da1f02b49",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "scheduler.pt:   0%|          | 0.00/1.47k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "0b8618e92b254e55b05d82ba1bc296c2",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "tokenizer.json:   0%|          | 0.00/11.4M [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "ca18b907d121469b8f61c96d9479589c",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "rng_state.pth:   0%|          | 0.00/14.6k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "75f403ce0a98466881327dcd2763e6c3",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "trainer_state.json: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "0ed72b2ddbfa432498d3e2383e188c9c",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "training_args.bin:   0%|          | 0.00/6.16k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "51cd0b1872a248588a28afd55680cd09",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "tokenizer_config.json: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "0a610499c8b647f9a53d921febd9ee2c",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "vocab.json: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "3f897b0a595a465c977cc40ec973abc8",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "special_tokens_map.json:   0%|          | 0.00/614 [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "7cd59a70262843c6a7c8b74a4a9afba2",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "README.md: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "c3e98d59c6e94095a26065a735673386",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "adapter_model.safetensors:   0%|          | 0.00/40.4M [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "b221d7136c95495782a03d16e367bc00",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "adapter_config.json:   0%|          | 0.00/806 [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "188dd4d9868445439088a85add7e1b6d",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "added_tokens.json:   0%|          | 0.00/707 [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "a5d6f33abc6742b783547fd7f51ec1f3",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "optimizer.pt:   0%|          | 0.00/21.0M [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "68c1bc672e6a492399bcb23d2a312b07",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "rng_state.pth:   0%|          | 0.00/14.6k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "6b30c3ebba3a4122a2843326c6e8bf00",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "merges.txt: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "d0df1b586367488894d1fea1f304ac81",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "tokenizer.json:   0%|          | 0.00/11.4M [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "b9989bdbb0d6406097eda38d36a5f1be",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "special_tokens_map.json:   0%|          | 0.00/614 [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "ea39317b0e5640fdb99105ecbcd55aba",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "scaler.pt:   0%|          | 0.00/1.38k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "c8f699ded6134a86bc466bc209034819",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "scheduler.pt:   0%|          | 0.00/1.47k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "14c89daf51a847c592c760de6563adfa",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "training_args.bin:   0%|          | 0.00/6.16k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "6881fd59fcd542dc865d19f81d549ef6",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "tokenizer_config.json: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "968ae1bac1f64a9788ca069c8c47df02",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "trainer_state.json: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "4ff85f80b4f345c985e01ad678bb242d",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "adapter_model.safetensors:   0%|          | 0.00/40.4M [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "5f0993fd5b3141038d41c9fe410a120c",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "vocab.json: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "4fed345408b54d0e9c2caec7162b40f0",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "README.md: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "4b382627e8b04f23985d4c571d860271",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "adapter_config.json:   0%|          | 0.00/806 [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "63e539b42d09464abbba9f54a4e6fb19",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "added_tokens.json:   0%|          | 0.00/707 [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "dbaad8a079134f0fb965614246044f26",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "merges.txt: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "3975fa0e01af46f7844fae83c0a32b42",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "rng_state.pth:   0%|          | 0.00/14.6k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "3ca467cdfd034378b72fa2ee0accc8e7",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "tokenizer.json:   0%|          | 0.00/11.4M [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "782980e035544c46b9d377265537fc2e",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "optimizer.pt:   0%|          | 0.00/21.0M [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "46aa7d878dc2422093d2181f3f5ec317",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "scaler.pt:   0%|          | 0.00/1.38k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "a5341586c09c4039be1c3e92b7b9364a",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "scheduler.pt:   0%|          | 0.00/1.47k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "af69e81d1a0a496fbc64e9e92a61bd07",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "training_args.bin:   0%|          | 0.00/6.16k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "9b84748c04824ee8b84d4488337c0816",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "special_tokens_map.json:   0%|          | 0.00/614 [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "276bcc5f9a8c4b4fae5ba25f9dd741f9",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "tokenizer_config.json: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "5c5917e15bbd43f8a24e1be4b9dafce9",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "trainer_state.json: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "614bde77777d403cb6b357587cfeb8e0",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "vocab.json: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "69de5f3586bd454e804c7ffac5fe4eca",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "adapter_model.safetensors:   0%|          | 0.00/40.4M [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "ae987d1e7a8648808793f7f2047bd69d",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "README.md: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "edf3d24b45e8488882f9042bbd6e7de7",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "adapter_config.json:   0%|          | 0.00/806 [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "0db9d3330e9641a4b765c754c3f98320",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "rng_state.pth:   0%|          | 0.00/14.6k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "7110b6ffec214ced8485c7cb8eea12b6",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "optimizer.pt:   0%|          | 0.00/21.0M [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "75fb51d2fd254aebb9d6eef1c1580e41",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "added_tokens.json:   0%|          | 0.00/707 [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "cab1457634bb4fa68dc97f880632a805",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "merges.txt: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "2b821ef882d444f0855f935202ca55f8",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "tokenizer.json:   0%|          | 0.00/11.4M [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "b998cc0c41c2491e94ea6ddaa6bd86b9",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "scaler.pt:   0%|          | 0.00/1.38k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "87caa0a34b9e4e57b84760b992fb8b4a",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "scheduler.pt:   0%|          | 0.00/1.47k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "9ab3712ab9bf4b6f9c708362fca452de",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "training_args.bin:   0%|          | 0.00/6.16k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "1dce96fc6f8e4babb307f332cb03ce36",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "special_tokens_map.json:   0%|          | 0.00/614 [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "55f8b9d867814ba8919bdf93fe960ec8",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "tokenizer_config.json: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "cdfe2373754742caa64d67980f31c880",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "trainer_state.json: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "40e665281ebe48eaab5bd3a294b23147",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "vocab.json: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "b5491c5f2ce24412a0e240a49b4fe992",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "README.md: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "1a1cd985e8c54fb2914281b3862fcd42",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "adapter_model.safetensors:   0%|          | 0.00/40.4M [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "addb81f89575426a87d9d95e55fa7116",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "adapter_config.json:   0%|          | 0.00/806 [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "a8b7eda77cc0420cbaabd0f5edfdadd9",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "optimizer.pt:   0%|          | 0.00/22.0M [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "db6d42bca44142f9b44c3bdec217dee6",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "rng_state.pth:   0%|          | 0.00/14.6k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "b27e2c3deb794849876a9cb7fe5767eb",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "added_tokens.json:   0%|          | 0.00/707 [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "a1bd5818d9314426b56c057849d22bbc",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "scaler.pt:   0%|          | 0.00/1.38k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "3ad7313c260b43849f8f76541ddec42b",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "scheduler.pt:   0%|          | 0.00/1.47k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "a04272a0df834bb2b8e92c4fde658b26",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "merges.txt: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "a6913712df9f4c859d2b771d83ffdd54",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "tokenizer.json:   0%|          | 0.00/11.4M [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "d5fb04a0edeb4f858e61aafe171058b3",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "special_tokens_map.json:   0%|          | 0.00/614 [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "729b3c32c2a64f57bfd4d0481c885bb5",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "training_args.bin:   0%|          | 0.00/6.16k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "183c646691d64a70b6c17e9260bfcc20",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "trainer_state.json: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "d89dbf9e62d547178c0172f8099e7ca7",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "tokenizer_config.json: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "3f1c8fa10742493b886f270d67e9c67d",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "vocab.json: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "90515c7c0fd445b08f2ff863c4213b28",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "README.md: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "c09c29b717ec4799b50c83870ea3a045",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "adapter_model.safetensors:   0%|          | 0.00/40.4M [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "9044bec11e1c4421ba11573b949dd378",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "adapter_config.json:   0%|          | 0.00/806 [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "182e69639a7d40d39c71ce113fa3fda2",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "optimizer.pt:   0%|          | 0.00/22.0M [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "53789c4c4b1f4c6e8059ab81514f6e93",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "added_tokens.json:   0%|          | 0.00/707 [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "a816bee369604c11ba753636145bc001",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "scheduler.pt:   0%|          | 0.00/1.47k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "8be4be2a6d534044a0fee93b9b5a7bf7",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "merges.txt: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "8d7a3b1fb07847e7b654c522d982d17a",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "scaler.pt:   0%|          | 0.00/1.38k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "3ea5787051ac4d7daca4f0912d4a6946",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "tokenizer.json:   0%|          | 0.00/11.4M [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "622c41eab7504509ab37dc892eb814db",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "training_args.bin:   0%|          | 0.00/6.16k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "aa92980f99564e2e82bdd6bb4c1e7159",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "rng_state.pth:   0%|          | 0.00/14.6k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "fe99863368274ca79fc4ba49f8e78183",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "special_tokens_map.json:   0%|          | 0.00/614 [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "9c89907808664566948c5f5da609a471",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "tokenizer_config.json: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "59103e1d337748388898305495e55abf",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "trainer_state.json: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "4ccdde61a96d437c9fd0c2d7f85b9e75",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "vocab.json: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "bffdf0fd93ae4b7ba122dac93b114e12",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "adapter_model.safetensors:   0%|          | 0.00/40.4M [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "1590d49b70ab4e8b9f26eb601a145fed",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "README.md: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "8ce491ab849349b3845608faeecdf2ab",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "adapter_config.json:   0%|          | 0.00/806 [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "409b075e1ce4451eac88b1295aba63a2",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "added_tokens.json:   0%|          | 0.00/707 [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "cca612cc17d9453482685fe63db01088",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "optimizer.pt:   0%|          | 0.00/22.0M [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "454d4b4023d24328bff76098e8cfefa0",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "merges.txt: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "74f09a1370ce42ed873b906bf8fffbe7",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "rng_state.pth:   0%|          | 0.00/14.6k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "477950fa11bf4474bfbb928533224e28",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "tokenizer.json:   0%|          | 0.00/11.4M [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "0ea9ae00d90345258df9a6f887d6565a",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "scaler.pt:   0%|          | 0.00/1.38k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "dc24f98a8e244e18b909438c470f1c98",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "scheduler.pt:   0%|          | 0.00/1.47k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "dc51b2519a0846cc8054644c2f094018",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "training_args.bin:   0%|          | 0.00/6.16k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "de27b175cfa94d93964427f9f916aab7",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "special_tokens_map.json:   0%|          | 0.00/614 [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "e4039bb6c5494a94a4e7c84034efc0f4",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "tokenizer_config.json: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "3755a6830b3c405ba45cd92c02092fa5",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "trainer_state.json: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "406d1c4e2d5a46c390bacc024858d541",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "README.md: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "d4a188fdf90b4d529c57458dd56acc41",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "vocab.json: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "c70040ac768245129a576310d16d8840",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "adapter_model.safetensors:   0%|          | 0.00/40.4M [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "d2d82654506644429119c28f0c7bd9bd",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "rng_state.pth:   0%|          | 0.00/14.6k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "129a8b2e3cd5487291e899c09e8b24af",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "adapter_config.json:   0%|          | 0.00/806 [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "ef23e4ebd64e4a22bb63fc7c2c4dadcf",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "optimizer.pt:   0%|          | 0.00/22.0M [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "307ec0ffd422475abce72f4a973a584e",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "added_tokens.json:   0%|          | 0.00/707 [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "74caf75f75c74d02b60c2774ab781cf6",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "scaler.pt:   0%|          | 0.00/1.38k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "5420a043b4574d03b750334efd6585ad",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "merges.txt: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "cca1ae734a3f445f872523caffef1a61",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "tokenizer.json:   0%|          | 0.00/11.4M [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "b80e7585b4224dafbe813ea30da5fb2f",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "scheduler.pt:   0%|          | 0.00/1.47k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "58da79fa17ee4dc7837ca20c4c23509f",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "training_args.bin:   0%|          | 0.00/6.16k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "bf4f2e0ead264994b3e193f60d242d10",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "special_tokens_map.json:   0%|          | 0.00/614 [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "e1640febaafd4fdd82b22dd979edd52c",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "tokenizer_config.json: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "516c1d21ed4e42ba8646616615c65a3f",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "vocab.json: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "8a335cea6e794d6ebb91be8a637dd44f",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "README.md: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "ab75642e79f44856bb96db77baa0858d",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "adapter_model.safetensors:   0%|          | 0.00/40.4M [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "7a9f37f3159841539f6995345a3d123b",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "adapter_config.json:   0%|          | 0.00/806 [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "6c4b8811071641539673069d0425ea82",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "trainer_state.json: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "ec139eaccc4d4d63ac84d0e320136240",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "added_tokens.json:   0%|          | 0.00/707 [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "4afa8debfe574dbcb434940d133e239b",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "optimizer.pt:   0%|          | 0.00/22.0M [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "788927bb2c564715950242fb83e4bf34",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "rng_state.pth:   0%|          | 0.00/14.6k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "5ed3777b2cc345ecba0b0bff59185f23",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "scheduler.pt:   0%|          | 0.00/1.47k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "0af5a1422d9c44d086753c401edc7f58",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "tokenizer.json:   0%|          | 0.00/11.4M [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "f60779ccb7ac42b8bf8ef98d1f6e617f",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "merges.txt: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "0dfc18807d584d0bb52c5028ceeba579",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "scaler.pt:   0%|          | 0.00/1.38k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "973aefa9421c4b86be931fddb89b4e6b",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "special_tokens_map.json:   0%|          | 0.00/614 [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "02058bbf32c041e49a0906e592ebfb3b",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "training_args.bin:   0%|          | 0.00/6.16k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "53250a37124240a09fcdaa69352b74e0",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "tokenizer_config.json: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "b8da79a001004de19104b0939f438c37",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "trainer_state.json: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "452a6b47d5e74aafbf7e5327331e7c47",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "vocab.json: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "0b2c0234f8b74523b7cd5f1e4dc505f5",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "adapter_model.safetensors:   0%|          | 0.00/40.4M [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "7e81af3972684d5aba2d74d62cbfe7cb",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "adapter_config.json:   0%|          | 0.00/806 [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "bbacffc1be8d43908488c4dff7263854",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "optimizer.pt:   0%|          | 0.00/22.0M [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "c00103e3c3ac4beea5aefe5e3fd9f764",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "README.md: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "afa9e793d7e14207baaffeabe7717ebc",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "added_tokens.json:   0%|          | 0.00/707 [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "406ba94117b24ddb9548aca62a00e7ce",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "merges.txt: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "b3b6332a1bc54a47acb94833f1f45067",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "rng_state.pth:   0%|          | 0.00/14.6k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "3b23910c375c4ceb8a2996f2737051bf",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "scaler.pt:   0%|          | 0.00/1.38k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "772b7ac34eab46eca4c813df39fe4c7d",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "tokenizer.json:   0%|          | 0.00/11.4M [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "858159f917544403a3ee454d1cb70b76",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "scheduler.pt:   0%|          | 0.00/1.47k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "b4243f1dcf5b43e287394e83cf65ae55",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "training_args.bin:   0%|          | 0.00/6.16k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "ec3d270e689f4982b358a3ce98fea6fe",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "special_tokens_map.json:   0%|          | 0.00/614 [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "22264c670371497d98ea00f7f8b81bde",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "tokenizer_config.json: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "8f9e7f5ff0934a21a1048f03a0be88e8",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "trainer_state.json: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "d3163d6efa354c13829a35474f6b1baf",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "vocab.json: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "7e147d857c2644319ad1aa9412003160",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "adapter_model.safetensors:   0%|          | 0.00/40.4M [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "c5164beb69ae4ef7b1ac53599d76f4b7",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "README.md: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "fa640ac0325e4fb89be14866e20cae5b",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "adapter_config.json:   0%|          | 0.00/806 [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "f6637f2ab0f64f71abf6fa329c85fd54",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "added_tokens.json:   0%|          | 0.00/707 [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "f23dc0e4c7264603a78a379a8fd169b5",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "optimizer.pt:   0%|          | 0.00/22.0M [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "aa2b8318ef2c440a9ba3fcb9ed396d27",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "rng_state.pth:   0%|          | 0.00/14.6k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "da3f308b9fdc41f1bf65bf30d43738d1",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "scaler.pt:   0%|          | 0.00/1.38k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "5fbfeb9914534aacad63237dcb34c75c",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "tokenizer.json:   0%|          | 0.00/11.4M [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "324402d4b8124ba0aa2ed0024e4c4eb8",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "scheduler.pt:   0%|          | 0.00/1.47k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "96d5cc588f3a47a781d05334c734c863",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "merges.txt: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "f1852a88034247849f40df239a134eb3",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "special_tokens_map.json:   0%|          | 0.00/614 [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "10bf431456564a1c9312ebcc14cfcce1",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "training_args.bin:   0%|          | 0.00/6.16k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "7a63979ab8e649cda861fd72fbc92700",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "tokenizer_config.json: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "43b5a5901ecf4ec48719baaacb5345c2",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "trainer_state.json: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "1551bf8878d745138bdfaaa89a40353b",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "vocab.json: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "2d77b860eca849858aee7489d77f8d89",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "adapter_model.safetensors:   0%|          | 0.00/40.4M [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "5274cc5fc98f49608772634c38af70c3",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "README.md: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "f1554e3def9f451482c4191319e1c35d",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "adapter_config.json:   0%|          | 0.00/806 [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "c5ad9cec72d64770826db1c200216fd8",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "added_tokens.json:   0%|          | 0.00/707 [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "d4d067d726584cf28129a7fdff2d91f4",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "optimizer.pt:   0%|          | 0.00/22.0M [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "c69f6cb6298e44c8b08cd526e881b1f3",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "rng_state.pth:   0%|          | 0.00/14.6k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "4d83608d555a4adb87b3d5b70b3a3c70",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "merges.txt: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "5401a2962d604b978f4c42c59b160ff2",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "scaler.pt:   0%|          | 0.00/1.38k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "72a1d9bc8a2a41bb84b4e64ab1b3626d",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "tokenizer.json:   0%|          | 0.00/11.4M [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "721d4753e1ce4b46899f12158fc107db",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "scheduler.pt:   0%|          | 0.00/1.47k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "dad43ab0186245b495648c50374e8e8c",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "training_args.bin:   0%|          | 0.00/6.16k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "22bc7d17bca14beaa32a3e5f94007577",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "special_tokens_map.json:   0%|          | 0.00/614 [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "945e6d00aea541c6a0703bbceaaf1826",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "tokenizer_config.json: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "60627a44be39421ab9e85535d5aa9256",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "trainer_state.json: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "596e1a9d6567410cb6e6f035247cea7b",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "vocab.json: 0.00B [00:00, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "text/plain": [
+       "'/kaggle/working/Qwen-3-0.6B-Reasoning-Vi-Medical-LoRA'"
+      ]
+     },
+     "execution_count": 2,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "import os\n",
+    "\n",
+    "from huggingface_hub import HfApi, snapshot_download\n",
+    "\n",
+    "# Hub client handle kept in the notebook namespace.\n",
+    "api = HfApi()\n",
+    "\n",
+    "# Hub model repository to mirror, and the local folder that receives its files.\n",
+    "repo_id = \"danhtran2mind/Qwen-3-0.6B-Reasoning-Vi-Medical-LoRA\"\n",
+    "save_path = \"./Qwen-3-0.6B-Reasoning-Vi-Medical-LoRA\"\n",
+    "\n",
+    "# Make sure the target folder exists before downloading into it.\n",
+    "os.makedirs(save_path, exist_ok=True)\n",
+    "\n",
+    "# Download every file of the model repo (not a dataset) into save_path;\n",
+    "# the returned local path is displayed as the cell output.\n",
+    "snapshot_download(repo_type=\"model\", repo_id=repo_id, local_dir=save_path)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {
+    "trusted": true
+   },
+   "outputs": [],
+   "source": [
+    "# To temporary Model hub\n",
+    "import os\n",
+    "\n",
+    "from huggingface_hub import HfApi, login\n",
+    "\n",
+    "# Log in to the Hugging Face Hub and create an API client.\n",
+    "# Never paste a real token into the notebook: it is read from the HF_TOKEN\n",
+    "# environment variable instead. When the variable is unset or empty, token is\n",
+    "# None and login() falls back to its interactive prompt.\n",
+    "login(token=os.environ.get(\"HF_TOKEN\") or None)\n",
+    "api = HfApi()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "metadata": {
+    "execution": {
+     "iopub.execute_input": "2025-07-06T11:12:58.670012Z",
+     "iopub.status.busy": "2025-07-06T11:12:58.669729Z",
+     "iopub.status.idle": "2025-07-06T11:13:30.782470Z",
+     "shell.execute_reply": "2025-07-06T11:13:30.781929Z",
+     "shell.execute_reply.started": "2025-07-06T11:12:58.669988Z"
+    },
+    "trusted": true
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "🦥 Unsloth: Will patch your computer to enable 2x faster free finetuning.\n"
+     ]
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "2025-07-06 11:13:10.169046: E external/local_xla/xla/stream_executor/cuda/cuda_fft.cc:477] Unable to register cuFFT factory: Attempting to register factory for plugin cuFFT when one has already been registered\n",
+      "WARNING: All log messages before absl::InitializeLog() is called are written to STDERR\n",
+      "E0000 00:00:1751800390.435353      35 cuda_dnn.cc:8310] Unable to register cuDNN factory: Attempting to register factory for plugin cuDNN when one has already been registered\n",
+      "E0000 00:00:1751800390.493002      35 cuda_blas.cc:1418] Unable to register cuBLAS factory: Attempting to register factory for plugin cuBLAS when one has already been registered\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "🦥 Unsloth Zoo will now patch everything to make training faster!\n"
+     ]
+    }
+   ],
+   "source": [
+    "import numpy as np\n",
+    "from datasets import concatenate_datasets, load_dataset\n",
+    "\n",
+    "from unsloth import FastLanguageModel\n",
+    "from unsloth import is_bfloat16_supported\n",
+    "from unsloth.chat_templates import train_on_responses_only  \n",
+    "import torch\n",
+    "\n",
+    "from trl import SFTTrainer\n",
+    "from transformers import TrainingArguments, DataCollatorForSeq2Seq"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 6,
+   "metadata": {
+    "execution": {
+     "iopub.execute_input": "2025-07-06T11:17:13.817972Z",
+     "iopub.status.busy": "2025-07-06T11:17:13.817246Z",
+     "iopub.status.idle": "2025-07-06T11:17:35.429882Z",
+     "shell.execute_reply": "2025-07-06T11:17:35.429104Z",
+     "shell.execute_reply.started": "2025-07-06T11:17:13.817938Z"
+    },
+    "trusted": true
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "==((====))==  Unsloth 2025.6.12: Fast Qwen3 patching. Transformers: 4.51.3.\n",
+      "   \\\\   /|    Tesla P100-PCIE-16GB. Num GPUs = 1. Max memory: 15.888 GB. Platform: Linux.\n",
+      "O^O/ \\_/ \\    Torch: 2.7.0+cu126. CUDA: 6.0. CUDA Toolkit: 12.6. Triton: 3.3.0\n",
+      "\\        /    Bfloat16 = FALSE. FA [Xformers = 0.0.30. FA2 = False]\n",
+      " \"-____-\"     Free license: http://github.com/unslothai/unsloth\n",
+      "Unsloth: Fast downloading is enabled - ignore downloading bars which are red colored!\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Load the Qwen3-0.6B model and its tokenizer through Unsloth.\n",
+    "model, tokenizer = FastLanguageModel.from_pretrained(\n",
+    "    model_name=\"Qwen/Qwen3-0.6B\",\n",
+    "    max_seq_length=2048,    # context length; can be raised at the cost of more memory\n",
+    "    load_in_4bit=True,      # 4-bit loading uses much less memory\n",
+    "    load_in_8bit=False,     # 8-bit is a bit more accurate but uses 2x the memory\n",
+    "    full_finetuning=False,  # full finetuning is available but switched off here\n",
+    ")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 7,
+   "metadata": {
+    "execution": {
+     "iopub.execute_input": "2025-07-06T11:17:44.514487Z",
+     "iopub.status.busy": "2025-07-06T11:17:44.513913Z",
+     "iopub.status.idle": "2025-07-06T11:17:51.099758Z",
+     "shell.execute_reply": "2025-07-06T11:17:51.098951Z",
+     "shell.execute_reply.started": "2025-07-06T11:17:44.514462Z"
+    },
+    "trusted": true
+   },
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "Unsloth 2025.6.12 patched 28 layers with 28 QKV layers, 28 O layers and 28 MLP layers.\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Attach LoRA adapters to the attention (q/k/v/o) and MLP (gate/up/down) projections.\n",
+    "model = FastLanguageModel.get_peft_model(\n",
+    "    model,\n",
+    "    target_modules=[\n",
+    "        \"q_proj\", \"k_proj\", \"v_proj\", \"o_proj\",\n",
+    "        \"gate_proj\", \"up_proj\", \"down_proj\",\n",
+    "    ],\n",
+    "    # Adapter hyper-parameters\n",
+    "    r=16,\n",
+    "    lora_alpha=16,\n",
+    "    lora_dropout=0,\n",
+    "    bias=\"none\",\n",
+    "    use_rslora=False,\n",
+    "    loftq_config=None,\n",
+    "    # Training-time options\n",
+    "    use_gradient_checkpointing=\"unsloth\",\n",
+    "    random_state=42,\n",
+    ")"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "# Data Preparation"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 8,
+   "metadata": {
+    "execution": {
+     "iopub.execute_input": "2025-07-06T11:17:51.101392Z",
+     "iopub.status.busy": "2025-07-06T11:17:51.101134Z",
+     "iopub.status.idle": "2025-07-06T11:17:51.105420Z",
+     "shell.execute_reply": "2025-07-06T11:17:51.104831Z",
+     "shell.execute_reply.started": "2025-07-06T11:17:51.101373Z"
+    },
+    "trusted": true
+   },
+   "outputs": [],
+   "source": [
+    "train_prompt_style = \"\"\"Bên dưới là một hướng dẫn mô tả nhiệm vụ, đi kèm với thông tin đầu vào để cung cấp thêm ngữ cảnh.\n",
+    "Hãy viết một phản hồi hoàn thành yêu cầu một cách phù hợp.\n",
+    "Trước khi trả lời, hãy suy nghĩ cẩn thận về câu hỏi và tạo ra một chuỗi suy nghĩ từng bước để đảm bảo một phản hồi logic và chính xác.\n",
+    "\n",
+    "### Instruction:\n",
+    "Bạn là một chuyên gia y khoa với kiến thức chuyên sâu về lập luận lâm sàng, chẩn đoán và lập kế hoạch điều trị.\n",
+    "Vui lòng trả lời câu hỏi y khoa sau đây.\n",
+    "\n",
+    "### Question:\n",
+    "{}\n",
+    "\n",
+    "### Response:\n",
+    "<think>\n",
+    "{}\n",
+    "</think>\n",
+    "{}\"\"\""
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 9,
+   "metadata": {
+    "execution": {
+     "iopub.execute_input": "2025-07-06T11:17:51.106342Z",
+     "iopub.status.busy": "2025-07-06T11:17:51.106128Z",
+     "iopub.status.idle": "2025-07-06T11:17:51.121509Z",
+     "shell.execute_reply": "2025-07-06T11:17:51.120908Z",
+     "shell.execute_reply.started": "2025-07-06T11:17:51.106327Z"
+    },
+    "trusted": true
+   },
+   "outputs": [],
+   "source": [
+    "# EOS_TOKEN = tokenizer.eos_token  # Must add EOS_TOKEN\n",
+    "\n",
+    "def formatting_prompts_func(examples):\n",
+    "    \"\"\"Render the training text for every row of a batched example dict.\n",
+    "\n",
+    "    Reads the `question`, `context` and `answer` columns and fills them, in that\n",
+    "    order, into the three slots of `train_prompt_style`. The tokenizer's EOS token\n",
+    "    is appended to each answer unless the answer already ends with it.\n",
+    "\n",
+    "    Returns a dict with a single `text` key holding the list of rendered prompts.\n",
+    "    \"\"\"\n",
+    "    eos = tokenizer.eos_token\n",
+    "    rows = zip(examples[\"question\"], examples[\"context\"], examples[\"answer\"])\n",
+    "    return {\n",
+    "        \"text\": [\n",
+    "            train_prompt_style.format(\n",
+    "                question, cot, answer if answer.endswith(eos) else answer + eos\n",
+    "            )\n",
+    "            for question, cot, answer in rows\n",
+    "        ]\n",
+    "    }"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 10,
+   "metadata": {
+    "execution": {
+     "iopub.execute_input": "2025-07-06T11:17:51.122972Z",
+     "iopub.status.busy": "2025-07-06T11:17:51.122759Z",
+     "iopub.status.idle": "2025-07-06T11:17:58.327195Z",
+     "shell.execute_reply": "2025-07-06T11:17:58.326516Z",
+     "shell.execute_reply.started": "2025-07-06T11:17:51.122951Z"
+    },
+    "trusted": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "7a411b6f59824d8eb23e58c0fad8f6fa",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "Generating train split:   0%|          | 0/14121 [00:00<?, ? examples/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "284c136a6b50451a9bdd86aba6ebd710",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "Generating test split:   0%|          | 0/785 [00:00<?, ? examples/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "1710ddf5daa24ee38df3b4a52bf82140",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "Generating validation split:   0%|          | 0/784 [00:00<?, ? examples/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "9b9b5267d2c24fb78e7935ef57e8182a",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "Map:   0%|          | 0/14121 [00:00<?, ? examples/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "53ee3de372c140efb717e0a3cc56f0d4",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "Map:   0%|          | 0/785 [00:00<?, ? examples/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "1fbc4a3474f84ae294f31ca27904fd4d",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "Map:   0%|          | 0/784 [00:00<?, ? examples/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    }
+   ],
+   "source": [
+    "from datasets import load_dataset\n",
+    "\n",
+    "# Load the \"disease\" configuration of ViMedAQA and add the rendered `text`\n",
+    "# column to every split in one pass (batched map).\n",
+    "# NOTE(review): trust_remote_code=True allows code shipped with the dataset repo\n",
+    "# to run locally - confirm it is still required for this dataset.\n",
+    "dataset = load_dataset(\"tmnam20/ViMedAQA\", \"disease\", trust_remote_code=True).map(\n",
+    "    formatting_prompts_func, batched=True\n",
+    ")\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 11,
+   "metadata": {
+    "execution": {
+     "iopub.execute_input": "2025-07-06T11:17:58.328879Z",
+     "iopub.status.busy": "2025-07-06T11:17:58.328589Z",
+     "iopub.status.idle": "2025-07-06T11:17:58.344766Z",
+     "shell.execute_reply": "2025-07-06T11:17:58.344220Z",
+     "shell.execute_reply.started": "2025-07-06T11:17:58.328862Z"
+    },
+    "trusted": true
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Number of training samples: 14121\n",
+      "Number of test samples: 1569\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Keep only the columns used downstream; every other column is dropped from each split.\n",
+    "columns_to_keep = ['question', 'answer', 'context', 'text']\n",
+    "columns_to_remove = [\n",
+    "    col\n",
+    "    for col in dataset['train'].column_names\n",
+    "    if col not in columns_to_keep\n",
+    "]\n",
+    "for split in list(dataset.keys()):\n",
+    "    dataset[split] = dataset[split].remove_columns(columns_to_remove)\n",
+    "\n",
+    "# The train split is used as-is.\n",
+    "training_samples = dataset['train']\n",
+    "\n",
+    "# Held-out set: validation and test splits concatenated, then shuffled with a fixed seed.\n",
+    "test_samples = concatenate_datasets(\n",
+    "    [dataset['validation'], dataset['test']]\n",
+    ").shuffle(seed=42)\n",
+    "\n",
+    "print(\"Number of training samples:\", training_samples.num_rows)\n",
+    "print(\"Number of test samples:\", test_samples.num_rows)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 12,
+   "metadata": {
+    "execution": {
+     "iopub.execute_input": "2025-07-06T11:17:58.345464Z",
+     "iopub.status.busy": "2025-07-06T11:17:58.345283Z",
+     "iopub.status.idle": "2025-07-06T11:17:58.474933Z",
+     "shell.execute_reply": "2025-07-06T11:17:58.474213Z",
+     "shell.execute_reply.started": "2025-07-06T11:17:58.345444Z"
+    },
+    "trusted": true
+   },
+   "outputs": [],
+   "source": [
+    "from transformers import DataCollatorForLanguageModeling\n",
+    "\n",
+    "# Batch collator built on the notebook's tokenizer, with masked-LM mode switched off (mlm=False).\n",
+    "data_collator = DataCollatorForLanguageModeling(mlm=False, tokenizer=tokenizer)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 13,
+   "metadata": {
+    "execution": {
+     "iopub.execute_input": "2025-07-06T11:17:58.476589Z",
+     "iopub.status.busy": "2025-07-06T11:17:58.476383Z",
+     "iopub.status.idle": "2025-07-06T11:17:58.490214Z",
+     "shell.execute_reply": "2025-07-06T11:17:58.489508Z",
+     "shell.execute_reply.started": "2025-07-06T11:17:58.476574Z"
+    },
+    "trusted": true
+   },
+   "outputs": [],
+   "source": [
+    "# Inference prompt: reuse the exact preamble of `train_prompt_style` (everything before\n",
+    "# its opening <think> tag) so the wording seen at inference time is identical to the\n",
+    "# wording the model is fine-tuned on. A separately typed copy can drift from the\n",
+    "# training template. The only placeholder left in the result is the question.\n",
+    "_prompt_preamble, _think_tag, _ = train_prompt_style.partition(\"<think>\")\n",
+    "assert _think_tag, \"train_prompt_style must contain an opening <think> tag\"\n",
+    "\n",
+    "# The prompt ends with the opening <think> tag followed by a blank line.\n",
+    "inference_prompt_style = _prompt_preamble + \"<think>\\n\\n\"\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 14,
+   "metadata": {
+    "execution": {
+     "iopub.execute_input": "2025-07-06T11:17:58.645858Z",
+     "iopub.status.busy": "2025-07-06T11:17:58.645605Z",
+     "iopub.status.idle": "2025-07-06T11:18:18.621520Z",
+     "shell.execute_reply": "2025-07-06T11:18:18.620888Z",
+     "shell.execute_reply.started": "2025-07-06T11:17:58.645841Z"
+    },
+    "trusted": true
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\n",
+      "<think>\n",
+      "\n",
+      "\n",
+      "</think>\n",
+      "\n",
+      "Suy nghĩ từng bước:\n",
+      "\n",
+      "1. **Xác định nguyên nhân**: Gout là một bệnh lý về đường dỷ hóa, liên quan đến quá trình tạo thành đường. Nguyên nhân chính là sự thay đổi trong lượng đường trong cơ thể, đặc biệt là sau khi tiêu hóa đường. Điều này dẫn đến các phản ứng tăng đường huyết, có thể gây ra các vấn đề như gout.\n",
+      "\n",
+      "2. **Cấu trúc cơ bản**: Gout xảy ra khi đường huyết tăng cao, dẫn đến sự phân chia của đường trong cơ thể. Điều này thường xảy ra do đường bị tiêu hóa, có thể do thiếu vitamin B12, vitamin B1, hoặc do đường huyết cao.\n",
+      "\n",
+      "3. **Sự khác biệt về tỷ lệ**: Nam giới có nguy cơ cao hơn phụ nữ trong việc kiểm soát và điều trị bệnh gout, đặc biệt là sau khi tiêu hóa đường. Điều này có thể do nam giới thường xuyên thay đổi đường trong cơ thể, dẫn đến tình trạng tăng đường huyết.\n",
+      "\n",
+      "4. **Bệnh lý y tế**: Gout là một bệnh lý đơn giản, có thể được điều trị bằng cách kiểm soát đường huyết, bổ sung vitamin B12, và điều chỉnh chế độ ăn. Do đó, việc lâm sàng thường xuyên kiểm tra và điều trị phù hợp là cần thiết.\n",
+      "\n",
+      "Vậy phản hồi: Nam giới có nguy cơ mắc bệnh gout cao hơn phụ nữ vì cơ thể thường xuyên thay đổi lượng đường, dẫn đến tình trạng tăng đường huyết. Điều này có thể ảnh hưởng đến khả năng kiểm soát bệnh và cần được điều trị kịp thời.\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Sanity-check generation on one training question with the model as it stands\n",
+    "# at this point in the notebook.\n",
+    "question = training_samples[10]['question']\n",
+    "\n",
+    "# The prompt must stay open-ended, so no EOS token is appended to it. In the training\n",
+    "# texts EOS only closes the response; ending the prompt with EOS would ask the model\n",
+    "# to continue after an end-of-sequence marker.\n",
+    "inputs = tokenizer(\n",
+    "    [inference_prompt_style.format(question)],\n",
+    "    return_tensors=\"pt\"\n",
+    ").to(\"cuda\")\n",
+    "\n",
+    "outputs = model.generate(\n",
+    "    input_ids=inputs.input_ids,\n",
+    "    attention_mask=inputs.attention_mask,\n",
+    "    max_new_tokens=1200,\n",
+    "    eos_token_id=tokenizer.eos_token_id,\n",
+    "    use_cache=True,\n",
+    ")\n",
+    "response = tokenizer.batch_decode(outputs, skip_special_tokens=True)\n",
+    "\n",
+    "# Print everything after the first response header. Splitting once and taking the last\n",
+    "# piece avoids an IndexError when the header is missing and keeps the full generation\n",
+    "# even if the model repeats the header.\n",
+    "print(response[0].split(\"### Response:\", 1)[-1])"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 18,
+   "metadata": {
+    "execution": {
+     "iopub.execute_input": "2025-07-06T11:20:30.194246Z",
+     "iopub.status.busy": "2025-07-06T11:20:30.193969Z",
+     "iopub.status.idle": "2025-07-06T11:20:30.221692Z",
+     "shell.execute_reply": "2025-07-06T11:20:30.221135Z",
+     "shell.execute_reply.started": "2025-07-06T11:20:30.194225Z"
+    },
+    "trusted": true
+   },
+   "outputs": [],
+   "source": [
+    "# Trainer configuration: evaluate and checkpoint every 100 steps so the checkpoint\n",
+    "# with the lowest eval_loss can be reloaded when training ends.\n",
+    "# NOTE(review): per the transformers documentation, TrainingArguments.resume_from_checkpoint\n",
+    "# is not consumed by Trainer itself; resuming also needs\n",
+    "# trainer.train(resume_from_checkpoint=...). Confirm the training call passes it.\n",
+    "arguments = TrainingArguments(\n",
+    "    # --- checkpoint locations ---\n",
+    "    output_dir=\"./Qwen-3-0.6B-Reasoning-Vi-Medical-LoRA\",\n",
+    "    resume_from_checkpoint=\"./Qwen-3-0.6B-Reasoning-Vi-Medical-LoRA\",\n",
+    "    # --- batching: 8 sequences x 4 accumulation steps per optimizer step, per device ---\n",
+    "    per_device_train_batch_size=8,\n",
+    "    per_device_eval_batch_size=8,\n",
+    "    gradient_accumulation_steps=4,\n",
+    "    # --- schedule and optimizer ---\n",
+    "    num_train_epochs=17,\n",
+    "    learning_rate=2e-4,\n",
+    "    lr_scheduler_type=\"linear\",\n",
+    "    warmup_steps=30,\n",
+    "    optim=\"adamw_8bit\",\n",
+    "    weight_decay=0.01,\n",
+    "    seed=42,\n",
+    "    # --- precision: bf16 when supported, otherwise fp16 ---\n",
+    "    bf16=is_bfloat16_supported(),\n",
+    "    fp16=not is_bfloat16_supported(),\n",
+    "    # --- evaluation, logging and checkpointing cadence ---\n",
+    "    eval_strategy=\"steps\",\n",
+    "    eval_steps=100,\n",
+    "    logging_steps=100,\n",
+    "    save_strategy=\"steps\",\n",
+    "    save_steps=100,\n",
+    "    save_total_limit=4,\n",
+    "    report_to=\"none\",\n",
+    "    # --- best-model selection: lower eval_loss is better ---\n",
+    "    metric_for_best_model=\"eval_loss\",\n",
+    "    greater_is_better=False,\n",
+    "    load_best_model_at_end=True,\n",
+    ")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 19,
+   "metadata": {
+    "execution": {
+     "iopub.execute_input": "2025-07-06T11:20:32.569180Z",
+     "iopub.status.busy": "2025-07-06T11:20:32.568905Z",
+     "iopub.status.idle": "2025-07-06T11:20:41.709986Z",
+     "shell.execute_reply": "2025-07-06T11:20:41.709391Z",
+     "shell.execute_reply.started": "2025-07-06T11:20:32.569161Z"
+    },
+    "trusted": true
+   },
+   "outputs": [
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "aeda8041da054066b08610037e1bbb13",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "Unsloth: Tokenizing [\"text\"]:   0%|          | 0/14121 [00:00<?, ? examples/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "1906e0bb974c4ed4a0d3975d1f441bc7",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "Unsloth: Tokenizing [\"text\"]:   0%|          | 0/1569 [00:00<?, ? examples/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    }
+   ],
+   "source": [
+    "# Build the supervised fine-tuning trainer from the model, the two dataset\n",
+    "# splits and the TrainingArguments defined in the previous cell.\n",
+    "trainer = SFTTrainer(\n",
+    "    model=model,\n",
+    "    tokenizer=tokenizer,\n",
+    "    args=arguments,\n",
+    "    # Data: both splits are tokenized from their \"text\" column.\n",
+    "    train_dataset=training_samples,\n",
+    "    eval_dataset=test_samples,\n",
+    "    dataset_text_field=\"text\",\n",
+    "    dataset_num_proc=2,\n",
+    "    max_seq_length=2048,\n",
+    "    # Packing is turned off here; enabling it can make training 5x faster for short sequences.\n",
+    "    packing=False,\n",
+    "    data_collator=DataCollatorForSeq2Seq(tokenizer=tokenizer),\n",
+    ")"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {
+    "execution": {
+     "iopub.execute_input": "2025-07-01T13:46:57.349739Z",
+     "iopub.status.busy": "2025-07-01T13:46:57.349513Z",
+     "iopub.status.idle": "2025-07-01T13:48:14.259335Z",
+     "shell.execute_reply": "2025-07-01T13:48:14.258227Z",
+     "shell.execute_reply.started": "2025-07-01T13:46:57.349713Z"
+    }
+   },
+   "source": [
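+    "# Start train process\n",
+    "\n",
+    "To start training from scratch instead of resuming from a saved checkpoint, run the following in a code cell:\n",
+    "\n",
+    "```python\n",
+    "trainer_stats = trainer.train()  # resume_from_checkpoint=True\n",
+    "```\n"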
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {
+    "execution": {
+     "iopub.execute_input": "2025-07-06T11:20:41.711435Z",
+     "iopub.status.busy": "2025-07-06T11:20:41.711208Z"
+    },
+    "trusted": true
+   },
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "==((====))==  Unsloth - 2x faster free finetuning | Num GPUs used = 1\n",
+      "   \\\\   /|    Num examples = 14,121 | Num Epochs = 17 | Total steps = 7,497\n",
+      "O^O/ \\_/ \\    Batch size per device = 8 | Gradient accumulation steps = 4\n",
+      "\\        /    Data Parallel GPUs = 1 | Total batch size (8 x 4 x 1) = 32\n",
+      " \"-____-\"     Trainable parameters = 10,092,544 of 600,000,000 (1.68% trained)\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "\n",
+       "    <div>\n",
+       "      \n",
+       "      <progress value='6796' max='7497' style='width:300px; height:20px; vertical-align: middle;'></progress>\n",
+       "      [6796/7497 2:14:37 < 2:38:53, 0.07 it/s, Epoch 15.41/17]\n",
+       "    </div>\n",
+       "    <table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       " <tr style=\"text-align: left;\">\n",
+       "      <th>Step</th>\n",
+       "      <th>Training Loss</th>\n",
+       "      <th>Validation Loss</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <td>6300</td>\n",
+       "      <td>0.417100</td>\n",
+       "      <td>0.762564</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <td>6400</td>\n",
+       "      <td>0.426200</td>\n",
+       "      <td>0.757956</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <td>6500</td>\n",
+       "      <td>0.423000</td>\n",
+       "      <td>0.749194</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <td>6600</td>\n",
+       "      <td>0.421900</td>\n",
+       "      <td>0.744881</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <td>6700</td>\n",
+       "      <td>0.407700</td>\n",
+       "      <td>0.747354</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table><p>"
+      ],
+      "text/plain": [
+       "<IPython.core.display.HTML object>"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "Unsloth: Not an error, but Qwen3ForCausalLM does not accept `num_items_in_batch`.\n",
+      "Using gradient accumulation will be very slightly less accurate.\n",
+      "Read more on gradient accumulation issues here: https://unsloth.ai/blog/gradient\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Resume from the newest checkpoint in the output directory when one exists,\n",
+    "# otherwise start a fresh run. Passing resume_from_checkpoint=True\n",
+    "# unconditionally raises ValueError on a clean kernel that has no checkpoint\n",
+    "# yet, which breaks Restart & Run All.\n",
+    "import os\n",
+    "\n",
+    "from transformers.trainer_utils import get_last_checkpoint\n",
+    "\n",
+    "# get_last_checkpoint lists the directory, so guard against it not existing.\n",
+    "last_checkpoint = (\n",
+    "    get_last_checkpoint(arguments.output_dir)\n",
+    "    if os.path.isdir(arguments.output_dir)\n",
+    "    else None\n",
+    ")\n",
+    "print(\"Resuming from:\", last_checkpoint if last_checkpoint else \"no checkpoint found, starting fresh\")\n",
+    "\n",
+    "# None means train from scratch; a path resumes from that checkpoint.\n",
+    "trainer.train(resume_from_checkpoint=last_checkpoint)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "# Inference"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 55,
+   "metadata": {
+    "execution": {
+     "iopub.execute_input": "2025-07-05T08:03:45.539957Z",
+     "iopub.status.busy": "2025-07-05T08:03:45.539471Z",
+     "iopub.status.idle": "2025-07-05T08:03:50.954695Z",
+     "shell.execute_reply": "2025-07-05T08:03:50.953913Z",
+     "shell.execute_reply.started": "2025-07-05T08:03:45.539931Z"
+    },
+    "trusted": true
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Question:  Tại sao nam giới có nguy cơ mắc bệnh gout cao hơn phụ nữ?\n",
+      "\n",
+      "<think>\n",
+      "\n",
+      "\n",
+      "Nam giới có nguy cơ mắc bệnh gout cao hơn phụ nữ. Nguyên nhân là do nam giới có hệ vi khuẩn Pseudomonas trong cơ thể cao hơn so với nữ giới. Vi khuẩn này gây ra các sản phẩm tích tụ trong các sụn khớp, từ đó gây ra bệnh gout.\n",
+      "</think>\n",
+      "Nam giới có nguy cơ mắc bệnh gout cao hơn phụ nữ vì có hệ vi khuẩn Pseudomonas trong cơ thể cao hơn so với nữ giới.\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Ask the model the same sample question that the earlier inference cell\n",
+    "# used, so the two answers can be compared.\n",
+    "# NOTE(review): this sample comes from training_samples, so it was seen during\n",
+    "# training; consider also checking a question from test_samples.\n",
+    "question = training_samples[10]['question']\n",
+    "\n",
+    "# Tokenize the bare prompt. No EOS token is appended here: EOS marks the end\n",
+    "# of a finished sequence, so a prompt that ends with EOS asks the model to\n",
+    "# continue after end-of-text instead of answering the question.\n",
+    "inputs = tokenizer(\n",
+    "    [inference_prompt_style.format(question)],\n",
+    "    return_tensors=\"pt\"\n",
+    ").to(\"cuda\")\n",
+    "\n",
+    "outputs = model.generate(\n",
+    "    input_ids=inputs.input_ids,\n",
+    "    attention_mask=inputs.attention_mask,\n",
+    "    max_new_tokens=1200,\n",
+    "    eos_token_id=tokenizer.eos_token_id,  # stop once the model emits EOS\n",
+    "    use_cache=True,\n",
+    ")\n",
+    "response = tokenizer.batch_decode(outputs, skip_special_tokens=True)\n",
+    "print(\"Question: \", question)\n",
+    "\n",
+    "# Print only the text after the '### Response:' marker. If the marker is\n",
+    "# missing, print the whole decoded text instead of raising IndexError.\n",
+    "_, marker, answer = response[0].partition(\"### Response:\")\n",
+    "print(answer if marker else response[0])"
+   ]
+  }
+ ],
+ "metadata": {
+  "kaggle": {
+   "accelerator": "gpu",
+   "dataSources": [],
+   "dockerImageVersionId": 31041,
+   "isGpuEnabled": true,
+   "isInternetEnabled": true,
+   "language": "python",
+   "sourceType": "notebook"
+  },
+  "kernelspec": {
+   "display_name": "Python 3",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.11.11"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 4
+}