kingabzpro
/

gpt-oss-20b-dermatology-qa

+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## Setting Up"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "%%capture\n",
+    "%pip install -U accelerate \n",
+    "%pip install -U peft \n",
+    "%pip install -U trl \n",
+    "%pip install -U bitsandbytes\n",
+    "%pip install -U transformers\n",
+    "%pip install -U tensorboard\n",
+    "%pip install -U openai-harmony\n",
+    "%pip install -U tiktoken\n",
+    "%pip install -U pyctcdecode"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "Note: Environment variable`HF_TOKEN` is set and is the current active token independently from the token you've just configured.\n"
+     ]
+    }
+   ],
+   "source": [
+    "from huggingface_hub import login\n",
+    "import os\n",
+    "HF_TOKEN= os.getenv(\"HF_TOKEN\")\n",
+    "\n",
+    "login(HF_TOKEN)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## Configs"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "BASE_MODEL_ID = \"openai/gpt-oss-20b\"\n",
+    "SAVED_MODEL_ID = \"gpt-oss-20b-dermatology-qa\"\n",
+    "DATASET_NAME = \"kingabzpro/dermatology-qa-firecrawl-dataset\""
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## Loading the model and tokenizer"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 4,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "1a21fc931ff7479896898c2bfaefaaa3",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "Loading checkpoint shards:   0%|          | 0/3 [00:00<?, ?it/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    }
+   ],
+   "source": [
+    "import torch\n",
+    "from transformers import AutoModelForCausalLM, AutoTokenizer, Mxfp4Config\n",
+    "\n",
+    "quantization_config = Mxfp4Config(dequantize=True)\n",
+    "model_kwargs = dict(\n",
+    "    attn_implementation=\"eager\",\n",
+    "    torch_dtype=torch.bfloat16,\n",
+    "    quantization_config=quantization_config,\n",
+    "    use_cache=False,\n",
+    "    device_map=\"auto\",\n",
+    ")\n",
+    "\n",
+    "model = AutoModelForCausalLM.from_pretrained(BASE_MODEL_ID, **model_kwargs)\n",
+    "tokenizer = AutoTokenizer.from_pretrained(BASE_MODEL_ID)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## Loading and processing the dataset"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 5,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "from openai_harmony import (\n",
+    "    Conversation,\n",
+    "    DeveloperContent,\n",
+    "    HarmonyEncodingName,\n",
+    "    Message,\n",
+    "    Role,\n",
+    "    load_harmony_encoding,\n",
+    ")\n",
+    "\n",
+    "# Load the Harmony encoder once\n",
+    "enc = load_harmony_encoding(HarmonyEncodingName.HARMONY_GPT_OSS)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 6,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "DERM_DEV_INSTRUCTIONS = (\n",
+    "    \"You are a board-certified dermatologist answering various dermatology questions.\"\n",
+    "    \" Answer clearly in 1–3 sentences. No speculation.\"\n",
+    ")\n",
+    "\n",
+    "\n",
+    "def render_pair_harmony(question: str, answer: str) -> str:\n",
+    "    \"\"\"Render one question/answer pair as a Harmony-formatted training string.\n",
+    "\n",
+    "    The conversation consists of a developer message carrying\n",
+    "    DERM_DEV_INSTRUCTIONS, the stripped question as the user turn and the\n",
+    "    stripped answer as the assistant turn. It is rendered to tokens with the\n",
+    "    module-level `enc` and decoded back to text.\n",
+    "    \"\"\"\n",
+    "    developer_msg = Message.from_role_and_content(\n",
+    "        Role.DEVELOPER,\n",
+    "        DeveloperContent.new().with_instructions(DERM_DEV_INSTRUCTIONS),\n",
+    "    )\n",
+    "    user_msg = Message.from_role_and_content(Role.USER, question.strip())\n",
+    "    assistant_msg = Message.from_role_and_content(Role.ASSISTANT, answer.strip())\n",
+    "\n",
+    "    conversation = Conversation.from_messages([developer_msg, user_msg, assistant_msg])\n",
+    "    return enc.decode(enc.render_conversation(conversation))\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 7,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "Parameter 'function'=<function to_harmony_batch at 0x7aa95e0afd80> of the transform datasets.arrow_dataset.Dataset._map_single couldn't be hashed properly, a random hash was used instead. Make sure your transforms and parameters are serializable with pickle or dill for the dataset fingerprinting and caching to work. If you reuse this transform, the caching mechanism will consider it to be different from the previous calls and recompute everything. This warning is only showed once. Subsequent hashing failures won't be showed.\n"
+     ]
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "afb999e8af5849d4955eaf0a26fbe17f",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "Map:   0%|          | 0/1001 [00:00<?, ? examples/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "DatasetDict({\n",
+      "    train: Dataset({\n",
+      "        features: ['question', 'answer', 'condition', 'difficulty', 'source_url', 'text'],\n",
+      "        num_rows: 900\n",
+      "    })\n",
+      "    test: Dataset({\n",
+      "        features: ['question', 'answer', 'condition', 'difficulty', 'source_url', 'text'],\n",
+      "        num_rows: 101\n",
+      "    })\n",
+      "})\n",
+      "<|start|>developer<|message|># Instructions\n",
+      "\n",
+      "You are a board-certified dermatologist answering various dermatology questions. Answer clearly in 1–3 sentences. No speculation.<|end|><|start|>user<|message|>What type of skin changes accompany the pustules in GPP?<|end|><|start|>assistant<|message|>The skin surrounding the pustules becomes erythematous, which means it appears red and inflamed. The affected skin is also painful. These changes occur during the recurrent flares of the disease.<|end|>\n"
+     ]
+    }
+   ],
+   "source": [
+    "from datasets import load_dataset\n",
+    "\n",
+    "# Load the dataset named by the DATASET_NAME config constant instead of repeating the repo id\n",
+    "dataset = load_dataset(DATASET_NAME, split=\"train\")\n",
+    "\n",
+    "\n",
+    "def to_harmony_batch(examples: dict) -> dict:\n",
+    "    \"\"\"Build the Harmony-formatted `text` column for a batch of Q&A rows.\n",
+    "\n",
+    "    Reads the parallel `question` and `answer` lists from `examples`, renders\n",
+    "    each stripped pair with `render_pair_harmony`, and returns the rendered\n",
+    "    strings under the `text` key.\n",
+    "    \"\"\"\n",
+    "    rendered = [\n",
+    "        render_pair_harmony(q.strip(), a.strip())\n",
+    "        for q, a in zip(examples[\"question\"], examples[\"answer\"])\n",
+    "    ]\n",
+    "    return {\"text\": rendered}\n",
+    "\n",
+    "\n",
+    "# Process dataset\n",
+    "dataset = dataset.map(to_harmony_batch, batched=True)\n",
+    "dataset = dataset.train_test_split(test_size=0.1, seed=42)\n",
+    "\n",
+    "print(dataset)\n",
+    "\n",
+    "print(dataset[\"train\"][0][\"text\"])\n"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## Model inference before fine-tuning"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 8,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "def render_inference_harmony(question: str) -> str:\n",
+    "    \"\"\"Render a question as a Harmony prompt awaiting the assistant's reply.\n",
+    "\n",
+    "    The prompt holds a developer message with DERM_DEV_INSTRUCTIONS followed by\n",
+    "    the stripped question as the user turn, rendered for completion by the\n",
+    "    assistant role and decoded back to text with the module-level `enc`.\n",
+    "    \"\"\"\n",
+    "    developer_msg = Message.from_role_and_content(\n",
+    "        Role.DEVELOPER,\n",
+    "        DeveloperContent.new().with_instructions(DERM_DEV_INSTRUCTIONS),\n",
+    "    )\n",
+    "    user_msg = Message.from_role_and_content(Role.USER, question.strip())\n",
+    "\n",
+    "    conversation = Conversation.from_messages([developer_msg, user_msg])\n",
+    "    prompt_tokens = enc.render_conversation_for_completion(conversation, Role.ASSISTANT)\n",
+    "    return enc.decode(prompt_tokens)\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 9,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "<|start|>developer<|message|># Instructions\n",
+      "\n",
+      "You are a board-certified dermatologist answering various dermatology questions. Answer clearly in 1–3 sentences. No speculation.<|end|><|start|>user<|message|>Why might winter be a problematic season for some people with eczema?<|end|><|start|>assistant<|channel|>analysis<|message|>They ask: \"Why might winter be a problematic season for some people with eczema?\" A dermatologist must answer succinctly. We'll provide reasons: cold, dry air, indoor heating increases dryness, reduces skin barrier, triggers flare-ups. Also less humidity helps dryness, exposure to indoor allergens, etc. Provide 1-3 sentences. Must be no speculation. Provide factual explanation. Must answer clearly.<|end|><|start|>assistant<|channel|>final<|message|>Winter can trigger eczema flare‑ups because cold, dry air and indoor heating strip the skin of moisture, compromising the skin barrier and making it more prone to irritation and infection. Lower humidity also increases scratching and can worsen inflammation, so maintaining skin hydration is particularly important during the colder months.<|return|>\n"
+     ]
+    }
+   ],
+   "source": [
+    "question = dataset[\"test\"][20][\"question\"]\n",
+    "\n",
+    "text = render_inference_harmony(question)\n",
+    "\n",
+    "# Send the prompt to the device the model actually lives on instead of assuming \"cuda\"\n",
+    "inputs = tokenizer(text, return_tensors=\"pt\").to(model.device)\n",
+    "outputs = model.generate(\n",
+    "    input_ids=inputs.input_ids,\n",
+    "    attention_mask=inputs.attention_mask,\n",
+    "    max_new_tokens=200,\n",
+    "    eos_token_id=tokenizer.eos_token_id,\n",
+    "    use_cache=True,\n",
+    ")\n",
+    "response = tokenizer.batch_decode(outputs)\n",
+    "print(response[0])\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 10,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Winter can trigger eczema flare‑ups because cold, dry air and indoor heating strip the skin of moisture, compromising the skin barrier and making it more prone to irritation and infection. Lower humidity also increases scratching and can worsen inflammation, so maintaining skin hydration is particularly important during the colder months.\n"
+     ]
+    }
+   ],
+   "source": [
+    "FINAL_MARKER = \"<|start|>assistant<|channel|>final<|message|>\"\n",
+    "decoded = response[0]\n",
+    "\n",
+    "marker_idx = decoded.find(FINAL_MARKER)\n",
+    "if marker_idx == -1:\n",
+    "    # find() returns -1 when generation stopped (e.g. at max_new_tokens) before the\n",
+    "    # final channel began; adding len(marker) to -1 would slice from a bogus offset.\n",
+    "    final_answer = \"No answer found in the text\"\n",
+    "else:\n",
+    "    start_idx = marker_idx + len(FINAL_MARKER)\n",
+    "    # Stop at the closing <|return|> if present, otherwise take the rest of the text\n",
+    "    end_idx = decoded.find(\"<|return|>\", start_idx)\n",
+    "    if end_idx == -1:\n",
+    "        end_idx = len(decoded)\n",
+    "    final_answer = decoded[start_idx:end_idx].strip()\n",
+    "print(final_answer)\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 11,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "'During winter, indoor air tends to be dry, which can trigger eczema flare‑ups for some individuals. The dryness of indoor environments in winter is a known trigger for these patients.'"
+      ]
+     },
+     "execution_count": 11,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "dataset[\"test\"][20][\"answer\"]"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## Setting up the model"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 12,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "trainable params: 15,040,512 || all params: 20,929,797,696 || trainable%: 0.0719\n"
+     ]
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "/usr/local/lib/python3.11/dist-packages/peft/tuners/lora/layer.py:159: UserWarning: Unsupported layer type '<class 'transformers.models.gpt_oss.modeling_gpt_oss.GptOssExperts'>' encountered, proceed at your own risk.\n",
+      "  warnings.warn(\n"
+     ]
+    }
+   ],
+   "source": [
+    "from peft import LoraConfig, get_peft_model\n",
+    "\n",
+    "peft_config = LoraConfig(\n",
+    "    r=8,\n",
+    "    lora_alpha=16,\n",
+    "    target_modules=\"all-linear\",\n",
+    "    target_parameters=[\n",
+    "        \"7.mlp.experts.gate_up_proj\",\n",
+    "        \"7.mlp.experts.down_proj\",\n",
+    "        \"15.mlp.experts.gate_up_proj\",\n",
+    "        \"15.mlp.experts.down_proj\",\n",
+    "        \"23.mlp.experts.gate_up_proj\",\n",
+    "        \"23.mlp.experts.down_proj\",\n",
+    "    ],\n",
+    ")\n",
+    "peft_model = get_peft_model(model, peft_config)\n",
+    "peft_model.print_trainable_parameters()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 13,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "from trl import SFTConfig\n",
+    "\n",
+    "training_args = SFTConfig(\n",
+    "    learning_rate=2e-4,\n",
+    "    gradient_checkpointing=True,\n",
+    "    num_train_epochs=1,\n",
+    "    logging_steps=10,\n",
+    "    bf16=True,\n",
+    "    per_device_train_batch_size=8,\n",
+    "    per_device_eval_batch_size=8,\n",
+    "    gradient_accumulation_steps=2,\n",
+    "    max_length=2048,\n",
+    "    warmup_ratio=0.03,\n",
+    "    eval_strategy=\"steps\",\n",
+    "    eval_steps=10,\n",
+    "    lr_scheduler_type=\"cosine_with_min_lr\",\n",
+    "    lr_scheduler_kwargs={\"min_lr_rate\": 0.1},\n",
+    "    output_dir=SAVED_MODEL_ID,\n",
+    "    report_to=\"tensorboard\",\n",
+    "    push_to_hub=True,\n",
+    ")"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## Model Training"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 14,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "78071bc85662408ebcc727e8de0f9ec7",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "Adding EOS to train dataset:   0%|          | 0/900 [00:00<?, ? examples/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "91c71a17c98b4465b5573711b65aaca3",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "Tokenizing train dataset:   0%|          | 0/900 [00:00<?, ? examples/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "c1de460d7e7b4fbc96c446cfa20ec591",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "Truncating train dataset:   0%|          | 0/900 [00:00<?, ? examples/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "e5f57bfd84064385b63a4df24da2c93d",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "Adding EOS to eval dataset:   0%|          | 0/101 [00:00<?, ? examples/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "cbea58e54f7949c39deea56ceb637266",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "Tokenizing eval dataset:   0%|          | 0/101 [00:00<?, ? examples/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "3d3f75508723415f870bdbac32c88ea3",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "Truncating eval dataset:   0%|          | 0/101 [00:00<?, ? examples/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "text/html": [
+       "\n",
+       "    <div>\n",
+       "      \n",
+       "      <progress value='57' max='57' style='width:300px; height:20px; vertical-align: middle;'></progress>\n",
+       "      [57/57 06:35, Epoch 1/1]\n",
+       "    </div>\n",
+       "    <table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       " <tr style=\"text-align: left;\">\n",
+       "      <th>Step</th>\n",
+       "      <th>Training Loss</th>\n",
+       "      <th>Validation Loss</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <td>10</td>\n",
+       "      <td>4.970200</td>\n",
+       "      <td>2.089929</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <td>20</td>\n",
+       "      <td>1.454900</td>\n",
+       "      <td>0.981939</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <td>30</td>\n",
+       "      <td>0.871900</td>\n",
+       "      <td>0.867009</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <td>40</td>\n",
+       "      <td>0.830900</td>\n",
+       "      <td>0.836862</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <td>50</td>\n",
+       "      <td>0.845000</td>\n",
+       "      <td>0.823363</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table><p>"
+      ],
+      "text/plain": [
+       "<IPython.core.display.HTML object>"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "text/plain": [
+       "TrainOutput(global_step=57, training_loss=1.6722588371812253, metrics={'train_runtime': 402.1596, 'train_samples_per_second': 2.238, 'train_steps_per_second': 0.142, 'total_flos': 1.1781569356397568e+16, 'train_loss': 1.6722588371812253})"
+      ]
+     },
+     "execution_count": 14,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "from trl import SFTTrainer\n",
+    "\n",
+    "trainer = SFTTrainer(\n",
+    "    model=peft_model,\n",
+    "    args=training_args,\n",
+    "    train_dataset=dataset[\"train\"],\n",
+    "    eval_dataset=dataset[\"test\"],\n",
+    "    processing_class=tokenizer,\n",
+    ")\n",
+    "trainer.train()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 15,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "217e9aaff6574d159a1a988ff583ff3c",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "Processing Files (0 / 0)                : |          |  0.00B /  0.00B            "
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "9a751f3aff01463499df49d9975252a8",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "New Data Upload                         : |          |  0.00B /  0.00B            "
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "a37515d0d5444c4194d40b60517f89ac",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "  ...events.1756035182.51336aae7b3d.93.0: 100%|##########| 6.77kB / 6.77kB            "
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "08b221ee56ce42c7ae1e4b7c97e54b08",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "  ...events.1756035572.51336aae7b3d.93.1: 100%|##########| 10.3kB / 10.3kB            "
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "a1dd80827c8240cca48b2f62624678ec",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "  ...ents.1756037571.51336aae7b3d.2438.0: 100%|##########| 6.45kB / 6.45kB            "
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "be6333ce8ef3415db35a755e930aa85c",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "  ...ents.1756037458.51336aae7b3d.2174.0: 100%|##########| 6.45kB / 6.45kB            "
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "e37affcd1ca64ee0b4e206cbe244a117",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "  ...ents.1756037652.51336aae7b3d.2641.0: 100%|##########| 10.4kB / 10.4kB            "
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "4062cbde5d2a46c1bc3b55556c10bcf2",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "  ...0b-dermatology-qa/training_args.bin: 100%|##########| 6.16kB / 6.16kB            "
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "5bbb5e92548e430c98d9fde415d36c82",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "  ...s-20b-dermatology-qa/tokenizer.json: 100%|##########| 27.9MB / 27.9MB            "
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "53c63643ee9643f4af1d8016c8dbc32f",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "  ...tology-qa/adapter_model.safetensors:  70%|######9   | 41.8MB / 60.2MB            "
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "No files have been modified since last commit. Skipping to prevent empty commit.\n"
+     ]
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "29576445acd942f499a65f3687e25eaf",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "Processing Files (0 / 0)                : |          |  0.00B /  0.00B            "
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "7c133dd9961643bd9ed042dfe7f67a12",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "New Data Upload                         : |          |  0.00B /  0.00B            "
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "016b81a696b3490589db33a5a92dd7eb",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "  ...events.1756035182.51336aae7b3d.93.0: 100%|##########| 6.77kB / 6.77kB            "
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "60e93471be1144f0a056dee1f2dbdcbe",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "  ...events.1756035572.51336aae7b3d.93.1: 100%|##########| 10.3kB / 10.3kB            "
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "e7bbd3b9fc604f9289257cbe876ccda6",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "  ...ents.1756037458.51336aae7b3d.2174.0: 100%|##########| 6.45kB / 6.45kB            "
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "ee7018041db44537b4d9e16909768f5f",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "  ...ents.1756037571.51336aae7b3d.2438.0: 100%|##########| 6.45kB / 6.45kB            "
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "9375111063c740509aa2046131404269",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "  ...ents.1756037652.51336aae7b3d.2641.0: 100%|##########| 10.4kB / 10.4kB            "
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "cfe5771010214e9197c21f990e2840da",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "  ...0b-dermatology-qa/training_args.bin: 100%|##########| 6.16kB / 6.16kB            "
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "da6a258f9d464998a5b1ae264121f97a",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "  ...tology-qa/adapter_model.safetensors:  56%|#####5    | 33.6MB / 60.2MB            "
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "931788c4fdfb4a47ac8b8cefe36cd54b",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "  ...s-20b-dermatology-qa/tokenizer.json: 100%|##########| 27.9MB / 27.9MB            "
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "text/plain": [
+       "CommitInfo(commit_url='https://huggingface.co/kingabzpro/gpt-oss-20b-dermatology-qa/commit/b1706fde1cbc1942ccf763061fa31b22e5b61cc6', commit_message='End of training', commit_description='', oid='b1706fde1cbc1942ccf763061fa31b22e5b61cc6', pr_url=None, repo_url=RepoUrl('https://huggingface.co/kingabzpro/gpt-oss-20b-dermatology-qa', endpoint='https://huggingface.co', repo_type='model', repo_id='kingabzpro/gpt-oss-20b-dermatology-qa'), pr_revision=None, pr_num=None)"
+      ]
+     },
+     "execution_count": 15,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "trainer.save_model(SAVED_MODEL_ID)\n",
+    "# `dataset_name` is meant to name the training dataset (it feeds the generated model card), not the model\n",
+    "trainer.push_to_hub(dataset_name=DATASET_NAME)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## Model inference after fine-tuning"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "MXFP4 quantization requires triton >= 3.4.0 and kernels installed, we will default to dequantizing the model to bf16\n"
+     ]
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "dc0cfff4f43a4675b78186cdf5625377",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "Loading checkpoint shards:   0%|          | 0/3 [00:00<?, ?it/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "/usr/local/lib/python3.11/dist-packages/peft/tuners/lora/layer.py:159: UserWarning: Unsupported layer type '<class 'transformers.models.gpt_oss.modeling_gpt_oss.GptOssExperts'>' encountered, proceed at your own risk.\n",
+      "  warnings.warn(\n"
+     ]
+    }
+   ],
+   "source": [
+    "from peft import PeftModel\n",
+    "from transformers import AutoModelForCausalLM, AutoTokenizer\n",
+    "\n",
+    "BASE_MODEL_ID = \"openai/gpt-oss-20b\"\n",
+    "SAVED_LORA_MODEL_ID = \"gpt-oss-20b-dermatology-qa\"\n",
+    "\n",
+    "# Load the tokenizer\n",
+    "tokenizer = AutoTokenizer.from_pretrained(BASE_MODEL_ID)\n",
+    "\n",
+    "# Load the original model first\n",
+    "model_kwargs = dict(\n",
+    "    attn_implementation=\"eager\", torch_dtype=\"auto\", use_cache=True, device_map=\"cuda\"\n",
+    ")\n",
+    "base_model = AutoModelForCausalLM.from_pretrained(\n",
+    "    BASE_MODEL_ID, **model_kwargs\n",
+    ")\n",
+    "\n",
+    "# Merge fine-tuned weights with the base model\n",
+    "model = PeftModel.from_pretrained(base_model, SAVED_LORA_MODEL_ID)\n",
+    "model = model.merge_and_unload()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "from datasets import load_dataset\n",
+    "\n",
+    "# Load dataset\n",
+    "dataset = load_dataset(\"kingabzpro/dermatology-qa-firecrawl-dataset\", split=\"train\")\n",
+    "dataset = dataset.train_test_split(test_size=0.1, seed=42)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 9,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "from openai_harmony import (\n",
+    "    Conversation,\n",
+    "    DeveloperContent,\n",
+    "    HarmonyEncodingName,\n",
+    "    Message,\n",
+    "    Role,\n",
+    "    load_harmony_encoding,\n",
+    ")\n",
+    "\n",
+    "# Load the Harmony encoder once\n",
+    "enc = load_harmony_encoding(HarmonyEncodingName.HARMONY_GPT_OSS)\n",
+    "\n",
+    "DERM_DEV_INSTRUCTIONS = (\n",
+    "    \"You are a board-certified dermatologist answering various dermatology questions.\"\n",
+    "    \" Answer clearly in 1–3 sentences. No speculation.\"\n",
+    ")\n",
+    "\n",
+    "def render_inference_harmony(question: str) -> str:\n",
+    "    \"\"\"Render a question as a Harmony prompt awaiting the assistant's reply.\n",
+    "\n",
+    "    The prompt holds a developer message with DERM_DEV_INSTRUCTIONS followed by\n",
+    "    the stripped question as the user turn, rendered for completion by the\n",
+    "    assistant role and decoded back to text with the module-level `enc`.\n",
+    "    \"\"\"\n",
+    "    developer_msg = Message.from_role_and_content(\n",
+    "        Role.DEVELOPER,\n",
+    "        DeveloperContent.new().with_instructions(DERM_DEV_INSTRUCTIONS),\n",
+    "    )\n",
+    "    user_msg = Message.from_role_and_content(Role.USER, question.strip())\n",
+    "\n",
+    "    conversation = Conversation.from_messages([developer_msg, user_msg])\n",
+    "    prompt_tokens = enc.render_conversation_for_completion(conversation, Role.ASSISTANT)\n",
+    "    return enc.decode(prompt_tokens)\n",
+    "\n",
+    "def extract_final_answer(text):\n",
+    "    \"\"\"Return the assistant's answer from a decoded Harmony transcript.\n",
+    "\n",
+    "    Args:\n",
+    "        text: Decoded generation, prompt included.\n",
+    "\n",
+    "    Returns:\n",
+    "        The stripped answer text. A message on the `final` channel is preferred;\n",
+    "        otherwise the first channel-less assistant message is used. The literal\n",
+    "        string \"No answer found in the text\" is returned when neither is present.\n",
+    "    \"\"\"\n",
+    "    start_markers = (\n",
+    "        \"<|start|>assistant<|channel|>final<|message|>\",\n",
+    "        \"<|start|>assistant<|message|>\",\n",
+    "    )\n",
+    "    for start_marker in start_markers:\n",
+    "        start_idx = text.find(start_marker)\n",
+    "        if start_idx != -1:\n",
+    "            break\n",
+    "    else:\n",
+    "        return \"No answer found in the text\"\n",
+    "\n",
+    "    # Move to the beginning of the actual answer\n",
+    "    start_idx += len(start_marker)\n",
+    "\n",
+    "    # The answer stops at whichever terminator comes first: a generation that ends\n",
+    "    # on EOS may close with <|return|> and never emit <|end|>.\n",
+    "    end_positions = [\n",
+    "        pos\n",
+    "        for pos in (text.find(tag, start_idx) for tag in (\"<|end|>\", \"<|return|>\"))\n",
+    "        if pos != -1\n",
+    "    ]\n",
+    "    end_idx = min(end_positions, default=len(text))\n",
+    "\n",
+    "    return text[start_idx:end_idx].strip()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 10,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "During winter, the dry skin that is typical in eczema can become even more dry, which may worsen eczema symptoms. The lack of moisture in the air can increase skin dryness.\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Take test example 20 and render its question as a Harmony prompt.\n",
+    "question = dataset[\"test\"][20][\"question\"]\n",
+    "text = render_inference_harmony(question)\n",
+    "\n",
+    "# Generate at most 200 new tokens, stopping early on the tokenizer's EOS token.\n",
+    "inputs = tokenizer(text, return_tensors=\"pt\").to(\"cuda\")\n",
+    "outputs = model.generate(\n",
+    "    input_ids=inputs[\"input_ids\"],\n",
+    "    attention_mask=inputs[\"attention_mask\"],\n",
+    "    eos_token_id=tokenizer.eos_token_id,\n",
+    "    max_new_tokens=200,\n",
+    "    use_cache=True,\n",
+    ")\n",
+    "\n",
+    "# Decode the generated sequence and keep only the assistant's answer.\n",
+    "response = tokenizer.batch_decode(outputs)\n",
+    "final_answer = extract_final_answer(response[0])\n",
+    "print(final_answer)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 14,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "'<|start|>developer<|message|># Instructions\\n\\nYou are a board-certified dermatologist answering various dermatology questions. Answer clearly in 1–3 sentences. No speculation.<|end|><|start|>user<|message|>How does the source suggest clinicians approach the diagnosis of rosacea?<|end|><|start|>assistant'"
+      ]
+     },
+     "execution_count": 14,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "# Show the Harmony prompt string currently bound to `text`.\n",
+    "text"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 11,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "'During winter, indoor air tends to be dry, which can trigger eczema flare‑ups for some individuals. The dryness of indoor environments in winter is a known trigger for these patients.'"
+      ]
+     },
+     "execution_count": 11,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "# Dataset answer for test example 20, shown for comparison with the generated answer.\n",
+    "dataset[\"test\"][20][\"answer\"]"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 12,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "The source suggests that clinicians approach the diagnosis of rosacea as a dynamic process that requires ongoing reassessment as patients develop new symptoms or present new presentations, rather than a one-time determination. This approach is intended to address changing manifestations within patients and evolving presentations in the population.\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Take test example 50 and render its question as a Harmony prompt.\n",
+    "question = dataset[\"test\"][50][\"question\"]\n",
+    "text = render_inference_harmony(question)\n",
+    "\n",
+    "# Generate at most 200 new tokens, stopping early on the tokenizer's EOS token.\n",
+    "inputs = tokenizer(text, return_tensors=\"pt\").to(\"cuda\")\n",
+    "outputs = model.generate(\n",
+    "    input_ids=inputs[\"input_ids\"],\n",
+    "    attention_mask=inputs[\"attention_mask\"],\n",
+    "    eos_token_id=tokenizer.eos_token_id,\n",
+    "    max_new_tokens=200,\n",
+    "    use_cache=True,\n",
+    ")\n",
+    "\n",
+    "# Decode the generated sequence and keep only the assistant's answer.\n",
+    "response = tokenizer.batch_decode(outputs)\n",
+    "final_answer = extract_final_answer(response[0])\n",
+    "print(final_answer)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 13,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "'The source suggests using a stepped approach, which typically involves evaluating the patient and then progressing through treatment options as needed. The text also mentions a differential diagnosis list to aid in distinguishing rosacea from other similar conditions.'"
+      ]
+     },
+     "execution_count": 13,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "# Dataset answer for test example 50, shown for comparison with the generated answer.\n",
+    "dataset[\"test\"][50][\"answer\"]"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 4,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "1ea55abf1ec6411f88a9e1c7bcf90446",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "Loading checkpoint shards:   0%|          | 0/3 [00:00<?, ?it/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "Device set to use cuda\n"
+     ]
+    }
+   ],
+   "source": [
+    "from transformers import pipeline\n",
+    "\n",
+    "# Build a text-generation pipeline for the kingabzpro/gpt-oss-20b-dermatology-qa checkpoint.\n",
+    "generator = pipeline(\n",
+    "    task=\"text-generation\",\n",
+    "    model=\"kingabzpro/gpt-oss-20b-dermatology-qa\",\n",
+    "    device=\"cuda\",  # or device=0\n",
+    ")\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 5,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "The source advises that clinicians should not rely solely on clinical presentation to diagnose rosacea. Instead, they should use a standardized, validated diagnostic tool such as the 2016 International Rosacea Consensus (IRC) criteria to confirm the diagnosis. This approach ensures a consistent and evidence‑based assessment rather than a subjective interpretation of symptoms.\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Query the pipeline with chat-style input: a single user turn.\n",
+    "question = \"How does the source suggest clinicians approach the diagnosis of rosacea?\"\n",
+    "\n",
+    "output = generator(\n",
+    "    [{\"role\": \"user\", \"content\": question}],\n",
+    "    return_full_text=False,\n",
+    "    max_new_tokens=200,\n",
+    ")[0]\n",
+    "\n",
+    "# Print the text of the first (only) result.\n",
+    "print(output[\"generated_text\"])"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 6,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "The source indicates that clinicians should consider rosacea when patients present with erythematous facial skin and may need to differentiate it from other conditions such as acne. Recognizing these features helps in identifying rosacea.\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Hand-written Harmony prompt: developer instructions, user question, open assistant turn.\n",
+    "prompt = (\n",
+    "    \"<|start|>developer<|message|># Instructions\\n\\n\"\n",
+    "    \"You are a board-certified dermatologist answering various dermatology questions. \"\n",
+    "    \"Answer clearly in 1–3 sentences. No speculation.<|end|>\"\n",
+    "    \"<|start|>user<|message|>How does the source suggest clinicians approach the diagnosis of rosacea?<|end|>\"\n",
+    "    \"<|start|>assistant\"\n",
+    ")\n",
+    "\n",
+    "output = generator(\n",
+    "    prompt,\n",
+    "    return_full_text=False,\n",
+    "    max_new_tokens=200,\n",
+    ")[0]\n",
+    "\n",
+    "# Print the text of the first (only) result.\n",
+    "print(output[\"generated_text\"])"
+   ]
+  }
+ ],
+ "metadata": {
+  "kaggle": {
+   "accelerator": "nvidiaTeslaT4",
+   "dataSources": [],
+   "dockerImageVersionId": 31011,
+   "isGpuEnabled": true,
+   "isInternetEnabled": true,
+   "language": "python",
+   "sourceType": "notebook"
+  },
+  "kernelspec": {
+   "display_name": "Python 3 (ipykernel)",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.11.11"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 4
+}