4 changes: 2 additions & 2 deletions nb/CodeForces-cot-Finetune_for_Reasoning_on_CodeForces.ipynb
@@ -253,8 +253,8 @@
" # [NEW] \"unsloth\" uses 30% less VRAM, fits 2x larger batch sizes!\n",
" use_gradient_checkpointing = \"unsloth\", # True or \"unsloth\" for very long context\n",
" random_state = 3407,\n",
" use_rslora = False, # We support rank stabilized LoRA\n",
" loftq_config = None, # And LoftQ\n",
" use_rslora = False, # rsLoRA: For correct scaling, set alpha ~ sqrt(r) if True.\n",
" loftq_config = None, # We support LoftQ\n",
")"
]
},
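The comment introduced across these notebooks refers to how rank-stabilized LoRA changes the adapter's scaling factor: standard LoRA scales the low-rank update by alpha / r, while rsLoRA scales it by alpha / sqrt(r), so turning on use_rslora with an unchanged alpha makes the effective update larger. The sketch below only illustrates that arithmetic; the lora_scaling helper and the r = 16, alpha = 16 values are assumptions for the example, not an unsloth or peft API.

import math

def lora_scaling(lora_alpha: float, r: int, use_rslora: bool) -> float:
    # Multiplier applied to the low-rank update B @ A:
    # standard LoRA uses alpha / r, rsLoRA uses alpha / sqrt(r).
    return lora_alpha / math.sqrt(r) if use_rslora else lora_alpha / r

# Assumed example values: r = 16, lora_alpha = 16.
print(lora_scaling(16, 16, use_rslora = False))  # 1.0  (alpha / r)
print(lora_scaling(16, 16, use_rslora = True))   # 4.0  (alpha / sqrt(r), 4x larger update)
print(lora_scaling(4,  16, use_rslora = True))   # 1.0  (alpha ~ sqrt(r) restores the original scale)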
4 changes: 2 additions & 2 deletions nb/CodeGemma_(7B)-Conversational.ipynb
@@ -153,8 +153,8 @@
" bias = \"none\", # Supports any, but = \"none\" is optimized\n",
" use_gradient_checkpointing = \"unsloth\", # True or \"unsloth\" for very long context\n",
" random_state = 3407,\n",
" use_rslora = False, # We support rank stabilized LoRA\n",
" loftq_config = None, # And LoftQ\n",
" use_rslora = False, # rsLoRA: For correct scaling, set alpha ~ sqrt(r) if True.\n",
" loftq_config = None, # We support LoftQ\n",
")"
]
},
4 changes: 2 additions & 2 deletions nb/Deepseek_OCR_(3B)-Eval.ipynb
@@ -541,8 +541,8 @@
" lora_dropout = 0,\n",
" bias = \"none\",\n",
" random_state = 3407,\n",
" use_rslora = False, # We support rank stabilized LoRA\n",
" loftq_config = None, # And LoftQ\n",
" use_rslora = False, # rsLoRA: For correct scaling, set alpha ~ sqrt(r) if True.\n",
" loftq_config = None, # We support LoftQ\n",
" # target_modules = \"all-linear\", # Optional now! Can specify a list if needed\n",
")"
]
4 changes: 2 additions & 2 deletions nb/Deepseek_OCR_(3B)-Evaluation.ipynb
@@ -694,8 +694,8 @@
" lora_dropout = 0,\n",
" bias = \"none\",\n",
" random_state = 3407,\n",
" use_rslora = False, # We support rank stabilized LoRA\n",
" loftq_config = None, # And LoftQ\n",
" use_rslora = False, # rsLoRA: For correct scaling, set alpha ~ sqrt(r) if True.\n",
" loftq_config = None, # We support LoftQ\n",
" # target_modules = \"all-linear\", # Optional now! Can specify a list if needed\n",
")"
]
4 changes: 2 additions & 2 deletions nb/Deepseek_OCR_(3B).ipynb
@@ -541,8 +541,8 @@
" lora_dropout = 0,\n",
" bias = \"none\",\n",
" random_state = 3407,\n",
" use_rslora = False, # We support rank stabilized LoRA\n",
" loftq_config = None, # And LoftQ\n",
" use_rslora = False, # rsLoRA: For correct scaling, set alpha ~ sqrt(r) if True.\n",
" loftq_config = None, # We support LoftQ\n",
" # target_modules = \"all-linear\", # Optional now! Can specify a list if needed\n",
")"
]
4 changes: 2 additions & 2 deletions nb/ERNIE_4_5_21B_A3B_PT-Conversational.ipynb
@@ -618,8 +618,8 @@
" # [NEW] \"unsloth\" uses 30% less VRAM, fits 2x larger batch sizes!\n",
" use_gradient_checkpointing = \"unsloth\", # True or \"unsloth\" for very long context\n",
" random_state = 3407,\n",
" use_rslora = False, # We support rank stabilized LoRA\n",
" loftq_config = None, # And LoftQ\n",
" use_rslora = False, # rsLoRA: For correct scaling, set alpha ~ sqrt(r) if True.\n",
" loftq_config = None, # We support LoftQ\n",
")"
]
},
2 changes: 1 addition & 1 deletion nb/ERNIE_4_5_VL_28B_A3B_PT_Vision.ipynb
@@ -875,7 +875,7 @@
" lora_dropout = 0,\n",
" bias = \"none\",\n",
" random_state = 3407,\n",
" use_rslora = False,\n",
" use_rslora = False, # rsLoRA: For correct scaling, set alpha ~ sqrt(r) if True.\n",
" target_modules = [\n",
" \"q_proj\", \"k_proj\", \"v_proj\", \"o_proj\",\n",
" \"gate_proj\", \"up_proj\", \"down_proj\",\n",
4 changes: 2 additions & 2 deletions nb/Gemma2_(2B)-Alpaca.ipynb
@@ -314,8 +314,8 @@
" # [NEW] \"unsloth\" uses 30% less VRAM, fits 2x larger batch sizes!\n",
" use_gradient_checkpointing = \"unsloth\", # True or \"unsloth\" for very long context\n",
" random_state = 3407,\n",
" use_rslora = False, # We support rank stabilized LoRA\n",
" loftq_config = None, # And LoftQ\n",
" use_rslora = False, # rsLoRA: For correct scaling, set alpha ~ sqrt(r) if True.\n",
" loftq_config = None, # We support LoftQ\n",
")"
]
},
4 changes: 2 additions & 2 deletions nb/Gemma2_(9B)-Alpaca.ipynb
@@ -343,8 +343,8 @@
" # [NEW] \"unsloth\" uses 30% less VRAM, fits 2x larger batch sizes!\n",
" use_gradient_checkpointing = \"unsloth\", # True or \"unsloth\" for very long context\n",
" random_state = 3407,\n",
" use_rslora = False, # We support rank stabilized LoRA\n",
" loftq_config = None, # And LoftQ\n",
" use_rslora = False, # rsLoRA: For correct scaling, set alpha ~ sqrt(r) if True.\n",
" loftq_config = None, # We support LoftQ\n",
")"
]
},
4 changes: 2 additions & 2 deletions nb/Gemma3N_(4B)-Audio.ipynb
@@ -416,8 +416,8 @@
" lora_dropout = 0,\n",
" bias = \"none\",\n",
" random_state = 3407,\n",
" use_rslora = False, # We support rank stabilized LoRA\n",
" loftq_config = None, # And LoftQ\n",
" use_rslora = False, # rsLoRA: For correct scaling, set alpha ~ sqrt(r) if True.\n",
" loftq_config = None, # We support LoftQ\n",
" target_modules = [\n",
" \"q_proj\", \"k_proj\", \"v_proj\", \"o_proj\",\n",
" \"gate_proj\", \"up_proj\", \"down_proj\",\n",
4 changes: 2 additions & 2 deletions nb/Gemma3N_(4B)-Vision.ipynb
@@ -474,8 +474,8 @@
" lora_dropout = 0,\n",
" bias = \"none\",\n",
" random_state = 3407,\n",
" use_rslora = False, # We support rank stabilized LoRA\n",
" loftq_config = None, # And LoftQ\n",
" use_rslora = False, # rsLoRA: For correct scaling, set alpha ~ sqrt(r) if True.\n",
" loftq_config = None, # We support LoftQ\n",
" target_modules = \"all-linear\", # Optional now! Can specify a list if needed\n",
")"
]
4 changes: 2 additions & 2 deletions nb/Gemma3_(270M).ipynb
@@ -364,8 +364,8 @@
" # [NEW] \"unsloth\" uses 30% less VRAM, fits 2x larger batch sizes!\n",
" use_gradient_checkpointing = \"unsloth\", # True or \"unsloth\" for very long context\n",
" random_state = 3407,\n",
" use_rslora = False, # We support rank stabilized LoRA\n",
" loftq_config = None, # And LoftQ\n",
" use_rslora = False, # rsLoRA: For correct scaling, set alpha ~ sqrt(r) if True.\n",
" loftq_config = None, # We support LoftQ\n",
")"
]
},
4 changes: 2 additions & 2 deletions nb/Gemma3_(4B)-Vision-GRPO.ipynb
@@ -448,8 +448,8 @@
" lora_dropout = 0,\n",
" bias = \"none\",\n",
" random_state = 3407,\n",
" use_rslora = False, # We support rank stabilized LoRA\n",
" loftq_config = None, # And LoftQ\n",
" use_rslora = False, # rsLoRA: For correct scaling, set alpha ~ sqrt(r) if True.\n",
" loftq_config = None, # We support LoftQ\n",
" use_gradient_checkpointing = \"unsloth\", # Reduces memory usage\n",
" # target_modules = \"all-linear\", # Optional now! Can specify a list if needed\n",
")"
4 changes: 2 additions & 2 deletions nb/Gemma3_(4B)-Vision.ipynb
@@ -396,8 +396,8 @@
" lora_dropout = 0,\n",
" bias = \"none\",\n",
" random_state = 3407,\n",
" use_rslora = False, # We support rank stabilized LoRA\n",
" loftq_config = None, # And LoftQ\n",
" use_rslora = False, # rsLoRA: For correct scaling, set alpha ~ sqrt(r) if True.\n",
" loftq_config = None, # We support LoftQ\n",
" target_modules = \"all-linear\", # Optional now! Can specify a list if needed\n",
")"
]
4 changes: 2 additions & 2 deletions nb/Granite4.0.ipynb
@@ -196,8 +196,8 @@
" # [NEW] \"unsloth\" uses 30% less VRAM, fits 2x larger batch sizes!\n",
" use_gradient_checkpointing = \"unsloth\", # True or \"unsloth\" for very long context\n",
" random_state = 3407,\n",
" use_rslora = False, # We support rank stabilized LoRA\n",
" loftq_config = None, # And LoftQ\n",
" use_rslora = False, # rsLoRA: For correct scaling, set alpha ~ sqrt(r) if True.\n",
" loftq_config = None, # We support LoftQ\n",
")"
]
},
4 changes: 2 additions & 2 deletions nb/Granite4.0_350M.ipynb
@@ -366,8 +366,8 @@
" # [NEW] \"unsloth\" uses 30% less VRAM, fits 2x larger batch sizes!\n",
" use_gradient_checkpointing = \"unsloth\", # True or \"unsloth\" for very long context\n",
" random_state = 3407,\n",
" use_rslora = False, # We support rank stabilized LoRA\n",
" loftq_config = None, # And LoftQ\n",
" use_rslora = False, # rsLoRA: For correct scaling, set alpha ~ sqrt(r) if True.\n",
" loftq_config = None, # We support LoftQ\n",
")"
]
},
4 changes: 2 additions & 2 deletions nb/HuggingFace Course-Gemma3_(4B)-Vision-GRPO.ipynb
@@ -450,8 +450,8 @@
" lora_dropout = 0,\n",
" bias = \"none\",\n",
" random_state = 3407,\n",
" use_rslora = False, # We support rank stabilized LoRA\n",
" loftq_config = None, # And LoftQ\n",
" use_rslora = False, # rsLoRA: For correct scaling, set alpha ~ sqrt(r) if True.\n",
" loftq_config = None, # We support LoftQ\n",
" use_gradient_checkpointing = \"unsloth\", # Reduces memory usage\n",
" # target_modules = \"all-linear\", # Optional now! Can specify a list if needed\n",
")"
4 changes: 2 additions & 2 deletions nb/HuggingFace Course-Qwen2_5_7B_VL_GRPO.ipynb
@@ -619,8 +619,8 @@
" lora_dropout = 0,\n",
" bias = \"none\",\n",
" random_state = 3407,\n",
" use_rslora = False, # We support rank stabilized LoRA\n",
" loftq_config = None, # And LoftQ\n",
" use_rslora = False, # rsLoRA: For correct scaling, set alpha ~ sqrt(r) if True.\n",
" loftq_config = None, # We support LoftQ\n",
" use_gradient_checkpointing = \"unsloth\", # Reduces memory usage\n",
" # target_modules = \"all-linear\", # Optional now! Can specify a list if needed\n",
")"
4 changes: 2 additions & 2 deletions nb/HuggingFace Course-Qwen3_VL_(8B)-Vision-GRPO.ipynb
@@ -558,8 +558,8 @@
" lora_dropout = 0,\n",
" bias = \"none\",\n",
" random_state = 3407,\n",
" use_rslora = False, # We support rank stabilized LoRA\n",
" loftq_config = None, # And LoftQ\n",
" use_rslora = False, # rsLoRA: For correct scaling, set alpha ~ sqrt(r) if True.\n",
" loftq_config = None, # We support LoftQ\n",
" use_gradient_checkpointing = \"unsloth\", # Reduces memory usage\n",
" # target_modules = \"all-linear\", # Optional now! Can specify a list if needed\n",
")"
4 changes: 2 additions & 2 deletions nb/HuggingFace Course-gpt-oss-(20B)_A100-GRPO.ipynb
@@ -765,8 +765,8 @@
" # [NEW] \"unsloth\" uses 30% less VRAM, fits 2x larger batch sizes!\n",
" use_gradient_checkpointing = \"unsloth\", # True or \"unsloth\" for very long context\n",
" random_state = 3407,\n",
" use_rslora = False, # We support rank stabilized LoRA\n",
" loftq_config = None, # And LoftQ\n",
" use_rslora = False, # rsLoRA: For correct scaling, set alpha ~ sqrt(r) if True.\n",
" loftq_config = None, # We support LoftQ\n",
")"
]
},
@@ -253,8 +253,8 @@
" # [NEW] \"unsloth\" uses 30% less VRAM, fits 2x larger batch sizes!\n",
" use_gradient_checkpointing = \"unsloth\", # True or \"unsloth\" for very long context\n",
" random_state = 3407,\n",
" use_rslora = False, # We support rank stabilized LoRA\n",
" loftq_config = None, # And LoftQ\n",
" use_rslora = False, # rsLoRA: For correct scaling, set alpha ~ sqrt(r) if True.\n",
" loftq_config = None, # We support LoftQ\n",
")"
]
},
4 changes: 2 additions & 2 deletions nb/Kaggle-CodeGemma_(7B)-Conversational.ipynb
@@ -153,8 +153,8 @@
" bias = \"none\", # Supports any, but = \"none\" is optimized\n",
" use_gradient_checkpointing = \"unsloth\", # True or \"unsloth\" for very long context\n",
" random_state = 3407,\n",
" use_rslora = False, # We support rank stabilized LoRA\n",
" loftq_config = None, # And LoftQ\n",
" use_rslora = False, # rsLoRA: For correct scaling, set alpha ~ sqrt(r) if True.\n",
" loftq_config = None, # We support LoftQ\n",
")"
]
},
4 changes: 2 additions & 2 deletions nb/Kaggle-Deepseek_OCR_(3B)-Eval.ipynb
@@ -541,8 +541,8 @@
" lora_dropout = 0,\n",
" bias = \"none\",\n",
" random_state = 3407,\n",
" use_rslora = False, # We support rank stabilized LoRA\n",
" loftq_config = None, # And LoftQ\n",
" use_rslora = False, # rsLoRA: For correct scaling, set alpha ~ sqrt(r) if True.\n",
" loftq_config = None, # We support LoftQ\n",
" # target_modules = \"all-linear\", # Optional now! Can specify a list if needed\n",
")"
]
4 changes: 2 additions & 2 deletions nb/Kaggle-Deepseek_OCR_(3B)-Evaluation.ipynb
@@ -694,8 +694,8 @@
" lora_dropout = 0,\n",
" bias = \"none\",\n",
" random_state = 3407,\n",
" use_rslora = False, # We support rank stabilized LoRA\n",
" loftq_config = None, # And LoftQ\n",
" use_rslora = False, # rsLoRA: For correct scaling, set alpha ~ sqrt(r) if True.\n",
" loftq_config = None, # We support LoftQ\n",
" # target_modules = \"all-linear\", # Optional now! Can specify a list if needed\n",
")"
]
4 changes: 2 additions & 2 deletions nb/Kaggle-Deepseek_OCR_(3B).ipynb
@@ -541,8 +541,8 @@
" lora_dropout = 0,\n",
" bias = \"none\",\n",
" random_state = 3407,\n",
" use_rslora = False, # We support rank stabilized LoRA\n",
" loftq_config = None, # And LoftQ\n",
" use_rslora = False, # rsLoRA: For correct scaling, set alpha ~ sqrt(r) if True.\n",
" loftq_config = None, # We support LoftQ\n",
" # target_modules = \"all-linear\", # Optional now! Can specify a list if needed\n",
")"
]
4 changes: 2 additions & 2 deletions nb/Kaggle-ERNIE_4_5_21B_A3B_PT-Conversational.ipynb
@@ -618,8 +618,8 @@
" # [NEW] \"unsloth\" uses 30% less VRAM, fits 2x larger batch sizes!\n",
" use_gradient_checkpointing = \"unsloth\", # True or \"unsloth\" for very long context\n",
" random_state = 3407,\n",
" use_rslora = False, # We support rank stabilized LoRA\n",
" loftq_config = None, # And LoftQ\n",
" use_rslora = False, # rsLoRA: For correct scaling, set alpha ~ sqrt(r) if True.\n",
" loftq_config = None, # We support LoftQ\n",
")"
]
},
2 changes: 1 addition & 1 deletion nb/Kaggle-ERNIE_4_5_VL_28B_A3B_PT_Vision.ipynb
@@ -875,7 +875,7 @@
" lora_dropout = 0,\n",
" bias = \"none\",\n",
" random_state = 3407,\n",
" use_rslora = False,\n",
" use_rslora = False, # rsLoRA: For correct scaling, set alpha ~ sqrt(r) if True.\n",
" target_modules = [\n",
" \"q_proj\", \"k_proj\", \"v_proj\", \"o_proj\",\n",
" \"gate_proj\", \"up_proj\", \"down_proj\",\n",
4 changes: 2 additions & 2 deletions nb/Kaggle-Gemma2_(2B)-Alpaca.ipynb
@@ -314,8 +314,8 @@
" # [NEW] \"unsloth\" uses 30% less VRAM, fits 2x larger batch sizes!\n",
" use_gradient_checkpointing = \"unsloth\", # True or \"unsloth\" for very long context\n",
" random_state = 3407,\n",
" use_rslora = False, # We support rank stabilized LoRA\n",
" loftq_config = None, # And LoftQ\n",
" use_rslora = False, # rsLoRA: For correct scaling, set alpha ~ sqrt(r) if True.\n",
" loftq_config = None, # We support LoftQ\n",
")"
]
},
4 changes: 2 additions & 2 deletions nb/Kaggle-Gemma2_(9B)-Alpaca.ipynb
@@ -343,8 +343,8 @@
" # [NEW] \"unsloth\" uses 30% less VRAM, fits 2x larger batch sizes!\n",
" use_gradient_checkpointing = \"unsloth\", # True or \"unsloth\" for very long context\n",
" random_state = 3407,\n",
" use_rslora = False, # We support rank stabilized LoRA\n",
" loftq_config = None, # And LoftQ\n",
" use_rslora = False, # rsLoRA: For correct scaling, set alpha ~ sqrt(r) if True.\n",
" loftq_config = None, # We support LoftQ\n",
")"
]
},
4 changes: 2 additions & 2 deletions nb/Kaggle-Gemma3N_(4B)-Audio.ipynb
@@ -416,8 +416,8 @@
" lora_dropout = 0,\n",
" bias = \"none\",\n",
" random_state = 3407,\n",
" use_rslora = False, # We support rank stabilized LoRA\n",
" loftq_config = None, # And LoftQ\n",
" use_rslora = False, # rsLoRA: For correct scaling, set alpha ~ sqrt(r) if True.\n",
" loftq_config = None, # We support LoftQ\n",
" target_modules = [\n",
" \"q_proj\", \"k_proj\", \"v_proj\", \"o_proj\",\n",
" \"gate_proj\", \"up_proj\", \"down_proj\",\n",
4 changes: 2 additions & 2 deletions nb/Kaggle-Gemma3N_(4B)-Vision.ipynb
@@ -474,8 +474,8 @@
" lora_dropout = 0,\n",
" bias = \"none\",\n",
" random_state = 3407,\n",
" use_rslora = False, # We support rank stabilized LoRA\n",
" loftq_config = None, # And LoftQ\n",
" use_rslora = False, # rsLoRA: For correct scaling, set alpha ~ sqrt(r) if True.\n",
" loftq_config = None, # We support LoftQ\n",
" target_modules = \"all-linear\", # Optional now! Can specify a list if needed\n",
")"
]
4 changes: 2 additions & 2 deletions nb/Kaggle-Gemma3_(270M).ipynb
@@ -364,8 +364,8 @@
" # [NEW] \"unsloth\" uses 30% less VRAM, fits 2x larger batch sizes!\n",
" use_gradient_checkpointing = \"unsloth\", # True or \"unsloth\" for very long context\n",
" random_state = 3407,\n",
" use_rslora = False, # We support rank stabilized LoRA\n",
" loftq_config = None, # And LoftQ\n",
" use_rslora = False, # rsLoRA: For correct scaling, set alpha ~ sqrt(r) if True.\n",
" loftq_config = None, # We support LoftQ\n",
")"
]
},
4 changes: 2 additions & 2 deletions nb/Kaggle-Gemma3_(4B)-Vision-GRPO.ipynb
@@ -441,8 +441,8 @@
" lora_dropout = 0,\n",
" bias = \"none\",\n",
" random_state = 3407,\n",
" use_rslora = False, # We support rank stabilized LoRA\n",
" loftq_config = None, # And LoftQ\n",
" use_rslora = False, # rsLoRA: For correct scaling, set alpha ~ sqrt(r) if True.\n",
" loftq_config = None, # We support LoftQ\n",
" use_gradient_checkpointing = \"unsloth\", # Reduces memory usage\n",
" # target_modules = \"all-linear\", # Optional now! Can specify a list if needed\n",
")"
4 changes: 2 additions & 2 deletions nb/Kaggle-Gemma3_(4B)-Vision.ipynb
@@ -396,8 +396,8 @@
" lora_dropout = 0,\n",
" bias = \"none\",\n",
" random_state = 3407,\n",
" use_rslora = False, # We support rank stabilized LoRA\n",
" loftq_config = None, # And LoftQ\n",
" use_rslora = False, # rsLoRA: For correct scaling, set alpha ~ sqrt(r) if True.\n",
" loftq_config = None, # We support LoftQ\n",
" target_modules = \"all-linear\", # Optional now! Can specify a list if needed\n",
")"
]
4 changes: 2 additions & 2 deletions nb/Kaggle-Granite4.0.ipynb
@@ -196,8 +196,8 @@
" # [NEW] \"unsloth\" uses 30% less VRAM, fits 2x larger batch sizes!\n",
" use_gradient_checkpointing = \"unsloth\", # True or \"unsloth\" for very long context\n",
" random_state = 3407,\n",
" use_rslora = False, # We support rank stabilized LoRA\n",
" loftq_config = None, # And LoftQ\n",
" use_rslora = False, # rsLoRA: For correct scaling, set alpha ~ sqrt(r) if True.\n",
" loftq_config = None, # We support LoftQ\n",
")"
]
},
4 changes: 2 additions & 2 deletions nb/Kaggle-Granite4.0_350M.ipynb
@@ -366,8 +366,8 @@
" # [NEW] \"unsloth\" uses 30% less VRAM, fits 2x larger batch sizes!\n",
" use_gradient_checkpointing = \"unsloth\", # True or \"unsloth\" for very long context\n",
" random_state = 3407,\n",
" use_rslora = False, # We support rank stabilized LoRA\n",
" loftq_config = None, # And LoftQ\n",
" use_rslora = False, # rsLoRA: For correct scaling, set alpha ~ sqrt(r) if True.\n",
" loftq_config = None, # We support LoftQ\n",
")"
]
},