10 changes: 5 additions & 5 deletions nb/Advanced_Llama3_2_(3B)_GRPO_LoRA.ipynb
@@ -3,8 +3,8 @@
{
"cell_type": "markdown",
"metadata": {
"id": "view-in-github",
"colab_type": "text"
"colab_type": "text",
"id": "view-in-github"
},
"source": [
"<a href=\"https://colab.research.google.com/github/unslothai/notebooks/blob/main/nb/Advanced_Llama3_2_(3B)_GRPO_LoRA.ipynb\" target=\"_parent\"><img src=\"https://colab.research.google.com/assets/colab-badge.svg\" alt=\"Open In Colab\"/></a>"
@@ -1257,7 +1257,7 @@
" lr_scheduler_type = \"cosine\",\n",
" optim = \"adamw_8bit\",\n",
" logging_steps = 1,\n",
" per_device_train_batch_size = 1,\n",
" per_device_train_batch_size = 4,\n",
" gradient_accumulation_steps = 4, # Increase to 4 for smoother training\n",
" num_generations = 4, # Decrease if out of memory\n",
" max_prompt_length = max_prompt_length,\n",
@@ -12746,8 +12746,8 @@
"accelerator": "GPU",
"colab": {
"gpuType": "T4",
"provenance": [],
"include_colab_link": true
"include_colab_link": true,
"provenance": []
},
"kernelspec": {
"display_name": "Python 3",
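Note: the recurring change across these notebooks is raising `per_device_train_batch_size` from 1 to the value of `num_generations`. In TRL's GRPO setup each batch entry is one sampled completion, and recent TRL versions generally expect the effective batch size (per-device batch × number of processes) to be divisible by `num_generations`, so matching the two is the simplest valid setting. Below is a minimal sketch of the updated arguments, assuming TRL's `GRPOConfig` and a `max_prompt_length` defined earlier in the notebook; any field not shown in the diff above is an illustrative placeholder, not part of this change.

```python
# Sketch of the updated GRPO arguments (values mirror the diff above;
# max_prompt_length and output_dir are assumed placeholders).
from trl import GRPOConfig

max_prompt_length = 256  # assumed: defined earlier in the notebook

training_args = GRPOConfig(
    lr_scheduler_type = "cosine",
    optim = "adamw_8bit",
    logging_steps = 1,
    per_device_train_batch_size = 4,  # was 1; now matches num_generations
    gradient_accumulation_steps = 4,  # increase to 4 for smoother training
    num_generations = 4,              # decrease if out of memory
    max_prompt_length = max_prompt_length,
    output_dir = "outputs",
)
```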
2 changes: 1 addition & 1 deletion nb/DeepSeek_R1_0528_Qwen3_(8B)_GRPO.ipynb
@@ -1711,7 +1711,7 @@
" lr_scheduler_type = \"linear\",\n",
" optim = \"adamw_8bit\",\n",
" logging_steps = 1,\n",
" per_device_train_batch_size = 1,\n",
" per_device_train_batch_size = 4,\n",
" gradient_accumulation_steps = 1, # Increase to 4 for smoother training\n",
" num_generations = 4, # Decrease if out of memory\n",
" max_prompt_length = max_prompt_length,\n",
169 changes: 70 additions & 99 deletions nb/Gemma3_(1B)-GRPO.ipynb

Large diffs are not rendered by default.

4 changes: 2 additions & 2 deletions nb/Gemma3_(4B)-Vision-GRPO.ipynb
@@ -1114,7 +1114,7 @@
},
{
"cell_type": "code",
"execution_count": 14,
"execution_count": null,
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/"
@@ -1144,7 +1144,7 @@
" lr_scheduler_type = \"cosine\",\n",
" optim = \"adamw_8bit\",\n",
" logging_steps = 1,\n",
" per_device_train_batch_size = 1,\n",
" per_device_train_batch_size = 4,\n",
" gradient_accumulation_steps = 2, # Increase to 4 for smoother training\n",
" num_generations = 4, # Decrease if out of memory\n",
" max_prompt_length = 1024,\n",
@@ -819,7 +819,7 @@
" lr_scheduler_type = \"cosine\",\n",
" optim = \"adamw_torch_fused\",\n",
" logging_steps = 1,\n",
" per_device_train_batch_size = 1,\n",
" per_device_train_batch_size = 8,\n",
" gradient_accumulation_steps = 4, # Increase to 4 for smoother training\n",
" num_generations = 8, # Decrease if out of memory\n",
" max_prompt_length = max_prompt_length,\n",
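Note: in the 8-generation configuration above, matching `per_device_train_batch_size` to `num_generations` means each forward pass holds exactly one prompt's full group of completions; with `gradient_accumulation_steps = 4`, one optimizer step then covers four prompt groups. A back-of-the-envelope check, assuming a single GPU and that each batch entry is one completion (as in TRL's GRPO):

```python
# Rough arithmetic for the 8-generation config above (single-GPU assumption).
per_device_train_batch_size = 8
gradient_accumulation_steps = 4
num_generations = 8

completions_per_optimizer_step = per_device_train_batch_size * gradient_accumulation_steps
prompt_groups_per_optimizer_step = completions_per_optimizer_step // num_generations

print(completions_per_optimizer_step)    # 32 completions scored per optimizer step
print(prompt_groups_per_optimizer_step)  # 4 prompts, each with 8 generations
```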
10 changes: 5 additions & 5 deletions nb/HuggingFace Course-Advanced_Llama3_2_(3B)_GRPO_LoRA.ipynb
@@ -3,8 +3,8 @@
{
"cell_type": "markdown",
"metadata": {
"id": "view-in-github",
"colab_type": "text"
"colab_type": "text",
"id": "view-in-github"
},
"source": [
"<a href=\"https://colab.research.google.com/github/unslothai/notebooks/blob/main/nb/Advanced_Llama3_2_(3B)_GRPO_LoRA.ipynb\" target=\"_parent\"><img src=\"https://colab.research.google.com/assets/colab-badge.svg\" alt=\"Open In Colab\"/></a>"
@@ -1257,7 +1257,7 @@
" lr_scheduler_type = \"cosine\",\n",
" optim = \"adamw_8bit\",\n",
" logging_steps = 1,\n",
" per_device_train_batch_size = 1,\n",
" per_device_train_batch_size = 4,\n",
" gradient_accumulation_steps = 4, # Increase to 4 for smoother training\n",
" num_generations = 4, # Decrease if out of memory\n",
" max_prompt_length = max_prompt_length,\n",
@@ -12746,8 +12746,8 @@
"accelerator": "GPU",
"colab": {
"gpuType": "T4",
"provenance": [],
"include_colab_link": true
"include_colab_link": true,
"provenance": []
},
"kernelspec": {
"display_name": "Python 3",
@@ -1713,7 +1713,7 @@
" lr_scheduler_type = \"linear\",\n",
" optim = \"adamw_8bit\",\n",
" logging_steps = 1,\n",
" per_device_train_batch_size = 1,\n",
" per_device_train_batch_size = 4,\n",
" gradient_accumulation_steps = 1, # Increase to 4 for smoother training\n",
" num_generations = 4, # Decrease if out of memory\n",
" max_prompt_length = max_prompt_length,\n",