From 0199d913728f8a38f86853caaa53654de84cc073 Mon Sep 17 00:00:00 2001
From: RossAscends <124905043+RossAscends@users.noreply.github.com>
Date: Wed, 3 Jan 2024 17:29:42 +0900
Subject: [PATCH 1/5] Update dropdown.html

---
 dropdown.html | 41 ++++++++++++++++++++++++++---------------
 1 file changed, 26 insertions(+), 15 deletions(-)
diff --git a/dropdown.html b/dropdown.html
index 5e03422..85ee761 100644
--- a/dropdown.html
+++ b/dropdown.html
@@ -26,33 +26,44 @@ <h4 data-i18n="Configuration">Configuration</h4>
             </div>
 
             <hr />
-            <div class="flex-container">
+            <div class="flex-container justifySpaceBetween">
                 <h4 data-i18n="Tabby API key">Model Select</h4>
                 <div id="reload_model_list_button" title="Refresh model list" data-i18n="[title]Refresh model list" class="menu_button fa-lg fa-solid fa-repeat"></div>
+
+                <div id="open_parameter_editor" class="menu_button">
+                    <i class="fa-solid fa-pen-to-square"></i>
+                    <span>Open Editor</span>
+                </div>
             </div>
 
             <small>Make sure an admin key is set to avoid errors.</small>
             <div class="flex-container flexFlowColumn">
                 <input id="model_list" name="model_list" class="text_pole flex1 wide100p" placeholder="Model name here" maxlength="100" size="35" value="" autocomplete="off">
                 <input id="draft_model_list" name="draft_model_list" class="text_pole flex1 wide100p" placeholder="Draft model name here" maxlength="100" size="35" value="" autocomplete="off">
-            </div>
-            <div id="loading_progress_container" class="progress_container">
-                <div id="loading_progressbar"></div>
-            </div>
-
-            <div class="flex-container">
-                <input id="load_model_button" class="menu_button" type="submit" value="Load" />
-                <input id="unload_model_button" class="menu_button" type="button" value="Unload" />
+                <div id="loading_progress_container" class="progress_container">
+                    <div id="loading_progressbar"></div>
+                </div>
+                <div class="flex-container">
+                    <input id="load_model_button" class="menu_button" type="submit" value="Load Model(& Draft)" />
+                    <input id="unload_model_button" class="menu_button" type="button" value="Unload Model & Draft" />
 
-                <div id="open_parameter_editor" class="menu_button">
-                    <i class="fa-solid fa-pen-to-square"></i>
-                    <span>Open Editor</span>
                 </div>
+                <div class="flex-container flexFlowColumn">
+                    <input id="lora_model_list" name="lora_model_list" class="text_pole flex1 wide100p" placeholder="Lora name here" maxlength="100" size="30" value="" autocomplete="off">
+                    <div id="loraLoadingNotification">Loading Lora.....<i class="fa-solid fa-spinner fa-spin"></i></div>
+                    <div class="flex-container">
+                        <input id="load_lora_button" class="menu_button" type="submit" value="Load Lora" />
+                        <input id="unload_lora_button" class="menu_button" type="button" value="Unload Lora" />
+                    </div>
+                </div>
+
+
+
+
+                <hr class="sysHR" />
             </div>
-            <hr class="sysHR" />
-        </div>
 
 
+        </div>
     </div>
 </div>
-</div>

From 52681152f7984bb072cc1bf19d5d12d04fd133f5 Mon Sep 17 00:00:00 2001
From: RossAscends <124905043+RossAscends@users.noreply.github.com>
Date: Wed, 3 Jan 2024 17:29:57 +0900
Subject: [PATCH 2/5] Update index.js

---
 index.js | 187 +++++++++++++++++++++++++++++++++++++++++++++++++------
 1 file changed, 168 insertions(+), 19 deletions(-)

diff --git a/index.js b/index.js
index c7c2864..3dfe14e 100644
--- a/index.js
+++ b/index.js
@@ -16,6 +16,10 @@ const defaultSettings = {};
 // Cached models list
 let models = [];
 let draftModels = [];
+let loraModels = [];
+let loraReqBody = {};
+let shouldLoadLora = false;
+
 
 // Check if user is connected to TabbyAPI
 function verifyTabby(logError = true) {
@@ -74,7 +78,7 @@ async function fetchModels() {
         console.error('TabbyLoader: Could not connect to TabbyAPI');
         return;
     }
-    var models, draftModels;
+    var models, draftModels, loraModels;
     // Remove trailing URL slash
     const apiUrl = getTabbyURL();
     try {
@@ -105,10 +109,23 @@ async function fetchModels() {
         if (draftModelListResponse.ok) {
             draftModels = await draftModelListResponse.json();
         } else {
-            console.error(`Request to /v1/model/list failed with a statuscode of ${response.status}:\n${response.statusText}`);
+            console.error(`Request to /v1/model/draft/list failed with a statuscode of ${draftModelListResponse.status}:\n${draftModelListResponse.statusText}`);
+            return [];
+        }
+
+        const loraModelListResponse = await fetch(`${apiUrl}/v1/lora/list`, {
+            headers: {
+                'X-api-key': authToken,
+            },
+        });
+
+        if (loraModelListResponse.ok) {
+            loraModels = await loraModelListResponse.json();
+        } else {
+            console.error(`Request to /v1/lora/list failed with a statuscode of ${loraModelListResponse.status}:\n${loraModelListResponse.statusText}`);
             return [];
         }
-        return [models.data.map((e) => e.id), draftModels.data.map((e) => e.id)];
+        return [models.data.map((e) => e.id), draftModels.data.map((e) => e.id), loraModels.data.map((e) => e.id)]; // [model ids, draft model ids, lora ids]
     } catch (error) {
         console.error(error);
 
@@ -124,6 +141,7 @@ async function onLoadModelClick() {
 
     const modelValue = $('#model_list').val();
     const draftModelValue = $('#draft_model_list').val();
+    const loraModelValue = $('#lora_model_list').val();
 
     if (!modelValue || !models.includes(modelValue)) {
         toastr.error('TabbyLoader: Please make sure the model name is spelled correctly before loading!');
@@ -131,11 +149,16 @@ async function onLoadModelClick() {
         return;
     }
 
-    if (draftModelValue !== '' && !models.includes(draftModelValue)) {
+    if (draftModelValue !== '' && !draftModels.includes(draftModelValue)) {
         toastr.error('TabbyLoader: Please make sure the draft model name is spelled correctly before loading!');
         return;
     }
 
+    if (loraModelValue !== '' && !loraModels.includes(loraModelValue)) {
+        toastr.error('TabbyLoader: Please make sure the lora name is spelled correctly before loading!');
+        return;
+    }
+
     const tabbyURL = getTabbyURL();
 
     const body = {
@@ -146,6 +169,7 @@ async function onLoadModelClick() {
         no_flash_attention: extensionSettings?.modelParams?.noFlashAttention,
         gpu_split_auto: extensionSettings?.modelParams?.gpuSplitAuto,
         cache_mode: extensionSettings?.modelParams?.eightBitCache ?? false ? 'FP8' : 'FP16',
+        use_cfg: extensionSettings?.modelParams?.useCfg,
     };
 
     if (draftModelValue) {
@@ -175,7 +199,7 @@ async function onLoadModelClick() {
 
         return;
     }
-    console.log(body);
+
     try {
         const response = await fetch(`${tabbyURL}/v1/model/load`, {
             method: 'POST',
@@ -187,7 +211,6 @@ async function onLoadModelClick() {
             body: JSON.stringify(body),
         });
 
-        console.log(response);
         if (response.ok) {
             const eventStream = new EventSourceStream();
             response.body.pipeThrough(eventStream);
@@ -195,11 +218,16 @@ async function onLoadModelClick() {
             const progressContainer = $('#loading_progress_container').hide();
             progressContainer.show();
             let soFar = 0;
-            let times;
-            draftModelValue ? times = 2 : times = 1;
+            let times = 1;
+
+            if (draftModelValue) { times++; }
+            if (loraModelValue) { times++; }
+
+            console.debug(`TabbyLoader: need to loop ${times} times`);
+
             while (true) {
                 const { value, done } = await reader.read();
-                console.log(soFar, times);
+                console.debug(`TabbyLoader: On loop ${soFar} of ${times}`);
                 if (done && soFar === times) break;
 
                 const packet = JSON.parse(value.data);
@@ -208,12 +236,18 @@ async function onLoadModelClick() {
                 const percent = numerator / denominator * 100;
 
                 if (packet.status === 'finished') {
-                    if (soFar === times - 1) {
+                    if (times === 1) {
                         progressContainer.hide();
                         toastr.info('TabbyLoader: Model loaded');
-                    } else {
+                        break;
+                    }
+                    if (soFar === times - 2 && times === 2) { // model+draft
                         $('#loading_progressbar').progressbar('value', 0);
                         toastr.info('TabbyLoader: Draft Model loaded');
+                    } else if (times === 2) {
+                        progressContainer.hide();
+                        toastr.info('TabbyLoader: Model loaded');
+                        break;
                     }
                     soFar++;
                 } else {
@@ -223,7 +257,7 @@ async function onLoadModelClick() {
         } else {
             const responseJson = await response.json();
             console.error('TabbyLoader: Could not load the model because:\n', responseJson?.detail ?? response.statusText);
-            toastr.error('TabbyLoader: Could not load the model. Please check the JavaScript or TabbyAPI console for details.');
+            toastr.error(`TabbyLoader: Could not load the model because: ${responseJson?.detail ?? response.statusText}`);
         }
     } catch (error) {
         console.error('TabbyLoader: Could not load the model because:\n', error);
@@ -234,6 +268,75 @@ async function onLoadModelClick() {
     }
 }
 
+// Load the lora named in #lora_model_list through TabbyAPI's /v1/lora/load endpoint.
+async function loadLora() {
+    const loraModelValue = $('#lora_model_list').val();
+    if (!loraModelValue) {
+        toastr.error('TabbyLoader: No lora selected!');
+        return;
+    }
+    const authToken = await getTabbyAuth();
+    if (!authToken) {
+        // eslint-disable-next-line
+        toastr.error("TabbyLoader: Admin key not found. Please provide one in SillyTavern's model settings or in the extension box.");
+        return;
+    }
+
+    loraReqBody.loras = [
+        {
+            name: loraModelValue,
+            scaling: extensionSettings?.loraAPICallParams?.lora.scaling,
+        },
+    ];
+
+    $('#loraLoadingNotification').show();
+    try {
+        const response = await fetch(`${getTabbyURL()}/v1/lora/load`, {
+            method: 'POST',
+            credentials: 'include',
+            headers: { ...getRequestHeaders(), 'X-admin-key': authToken },
+            body: JSON.stringify(loraReqBody),
+        });
+        if (!response.ok) {
+            const responseJson = await response.json().catch(() => null); // error body may not be JSON
+            throw new Error(responseJson?.detail ?? response.statusText);
+        }
+        toastr.info('TabbyLoader: Lora loaded');
+    } catch (error) {
+        console.error('TabbyLoader: Could not load the lora because:\n', error);
+        toastr.error(`TabbyLoader: Could not load the lora because: ${error?.message ?? error}`);
+    } finally {
+        // Runs on every path so a rejected fetch cannot leave the spinner visible.
+        $('#loraLoadingNotification').hide();
+        shouldLoadLora = false;
+    }
+}
+
+// Ask TabbyAPI to unload the lora (GET /v1/lora/unload) and report the outcome through toastr.
+async function unloadLora() {
+    verifyTabby();
+    const tabbyURL = getTabbyURL();
+
+    const authToken = await getTabbyAuth();
+    if (!authToken) {
+        return;
+    }
+    try {
+        const response = await fetch(`${tabbyURL}/v1/lora/unload`, {
+            method: 'GET',
+            headers: { 'X-admin-key': authToken },
+        });
+        if (!response.ok) {
+            const responseJson = await response.json().catch(() => null); // error body may not be JSON
+            throw new Error(responseJson?.detail ?? response.statusText);
+        }
+        toastr.info('TabbyLoader: Lora unloaded');
+    } catch (error) {
+        // Also reached when fetch itself rejects (e.g. the server is unreachable).
+        console.error('TabbyLoader: Could not unload the lora because:\n', error);
+        toastr.error(`TabbyLoader: Could not unload the lora because: ${error?.message ?? error}`);
+    }
+}
+
 async function onUnloadModelClick() {
     verifyTabby();
     const tabbyURL = getTabbyURL();
@@ -255,7 +358,7 @@ async function onUnloadModelClick() {
     } else {
         const responseJson = await response.json();
         console.error('TabbyLoader: Could not unload the model because:\n', responseJson?.detail ?? response.statusText);
-        toastr.error('Could not unload the model. Please check the JavaScript or TabbyAPI console for details.');
+        toastr.error(`Could not unload the model because: ${responseJson?.detail ?? response.statusText}`);
     }
 }
 
@@ -276,12 +379,18 @@ async function onParameterEditorClick() {
     parameterHtml
         .find('input[name="draft_rope_alpha"]')
         .val(extensionSettings?.modelParams?.draft?.draft_ropeAlpha ?? 1.0);
+    parameterHtml
+        .find('input[name="lora_scale"]')
+        .val(extensionSettings?.modelParams?.lora?.scaling ?? 1.0);
     parameterHtml
         .find('input[name="no_flash_attention"]')
         .prop('checked', extensionSettings?.modelParams?.noFlashAttention ?? false);
     parameterHtml
         .find('input[name="eight_bit_cache"]')
         .prop('checked', extensionSettings?.modelParams?.eightBitCache ?? false);
+    parameterHtml
+        .find('input[name="use_cfg"]')
+        .prop('checked', extensionSettings?.modelParams?.useCfg ?? false);
 
     // MARK: GPU split options
     const gpuSplitAuto = extensionSettings?.modelParams?.gpuSplitAuto ?? true;
@@ -312,11 +421,19 @@ async function onParameterEditorClick() {
             noFlashAttention: parameterHtml.find('input[name="no_flash_attention"]').prop('checked'),
             gpuSplitAuto: parameterHtml.find('input[name="gpu_split_auto"]').prop('checked'),
             eightBitCache: parameterHtml.find('input[name="eight_bit_cache"]').prop('checked'),
+            useCfg: parameterHtml.find('input[name="use_cfg"]').prop('checked'),
+        };
+
+        const loraAPICallParams = {
+            loras: {
+                name: parameterHtml.find('input[name="lora_model_list"]').val(),
+                scaling: parameterHtml.find('input[name="lora_scale"]').val(),
+            },
         };
 
         // Handle GPU split setting
         const gpuSplitVal = parameterHtml.find('input[name="gpu_split_value"]').val();
-        try { 
+        try {
             const gpuSplitArray = JSON.parse(gpuSplitVal) ?? [];
             if (Array.isArray(gpuSplitArray)) {
                 newParams['gpuSplit'] = gpuSplitArray;
@@ -329,7 +446,7 @@ async function onParameterEditorClick() {
             newParams['gpuSplit'] = [];
         }
 
-        Object.assign(extensionSettings, { modelParams: newParams });
+        Object.assign(extensionSettings, { modelParams: newParams, loraParams: loraAPICallParams });
         saveSettingsDebounced();
     }
 }
@@ -356,8 +473,9 @@ jQuery(async () => {
     // This is an example of loading HTML from a file
     const settingsHtml = await $.get(`${extensionFolderPath}/dropdown.html`);
     let allmodels = await fetchModels();
-    models = allmodels[0]
-    draftModels = allmodels[1]
+    models = allmodels[0];
+    draftModels = allmodels[1];
+    loraModels = allmodels[2];
 
     // Append settingsHtml to extensions_settings
     // extension_settings and extensions_settings2 are the left and right columns of the settings menu
@@ -394,6 +512,21 @@ jQuery(async () => {
                 );
         });
 
+    $('#lora_model_list')
+        .autocomplete({
+            source: (_, response) => {
+                return response(loraModels);
+            },
+            minLength: 0,
+        })
+        .focus(function () {
+            $(this)
+                .autocomplete(
+                    'search',
+                    $(this).val(),
+                );
+        });
+
     // These are examples of listening for events
     $('#load_model_button').on('click', function () {
         if (verifyTabby()) {
@@ -407,11 +540,25 @@ jQuery(async () => {
         }
     });
 
+    $('#load_lora_button').on('click', function () {
+        if (verifyTabby()) {
+            loadLora();
+        }
+    });
+
+    $('#unload_lora_button').on('click', function () {
+        if (verifyTabby()) {
+            unloadLora();
+        }
+    });
+
+
     $('#reload_model_list_button').on('click', async function () {
         if (verifyTabby()) {
             let allmodels = await fetchModels();
-            models = allmodels[0]
-            draftModels = allmodels[1]
+            models = allmodels[0];
+            draftModels = allmodels[1];
+            loraModels = allmodels[2];
         }
     });
 
@@ -448,6 +595,8 @@ jQuery(async () => {
         onParameterEditorClick();
     });
 
+    $('#loraLoadingNotification').hide();
+
     // Load settings when starting things up (if you have any)
     await loadSettings();
 });

From 799f3a539d4c3beb029205fe4a1abdd1f14f25c0 Mon Sep 17 00:00:00 2001
From: RossAscends <124905043+RossAscends@users.noreply.github.com>
Date: Wed, 3 Jan 2024 17:30:09 +0900
Subject: [PATCH 3/5] Update modelParameters.html

---
 modelParameters.html | 44 ++++++++++++++++++++++++++++++++------------
 1 file changed, 32 insertions(+), 12 deletions(-)

diff --git a/modelParameters.html b/modelParameters.html
index b79d719..be08057 100644
--- a/modelParameters.html
+++ b/modelParameters.html
@@ -33,22 +33,38 @@ <h3><strong data-i18n="">Set Parameters</strong>
                 <input name="rope_alpha" class="text_pole" type="text" />
             </div>
         </div>
-        Draft Model
         <div class="flex-container">
-            <div class="flex1">
-                <label for="rope_scale">
-                    <small data-i18n="Rope Scale">Rope Scale</small>
-                </label>
-                <input name="draft_rope_scale" class="text_pole" type="text" />
+            <div class="flex-container flex1 flexFlowColumn">
+                Draft Model
+                <div class="flex-container">
+                    <div class="flex1">
+                        <label for="rope_scale">
+                            <small data-i18n="Rope Scale">Rope Scale</small>
+                        </label>
+                        <input name="draft_rope_scale" class="text_pole" type="text" />
+                    </div>
+                    <div class="flex1">
+                        <label for="rope_alpha">
+                            <small data-i18n="Rope Alpha">Rope Alpha</small>
+                        </label>
+                        <input name="draft_rope_alpha" class="text_pole" type="text" />
+                    </div>
+                </div>
             </div>
-            <div class="flex1">
-                <label for="rope_alpha">
-                    <small data-i18n="Rope Alpha">Rope Alpha</small>
-                </label>
-                <input name="draft_rope_alpha" class="text_pole" type="text" />
+            <div class="flex-container flex1 flexFlowColumn">
+                Lora
+                <div class="flex-container flex1">
+                    <div class="flex1">
+                        <label for="lora_scale"> <!-- must match the id of the input below -->
+                            <small data-i18n="Lora Strength">Lora Strength</small>
+                        </label>
+                        <input id="lora_scale" name="lora_scale" class="text_pole flex1 wide100p" placeholder="Integer Required" maxlength="100" size="5" min="0" max="10" value="">
+                    </div>
+                </div>
             </div>
         </div>
 
+
         <!-- Container for GPU Split and other options -->
         <div class="flex-container">
             <div class="flex-container flexFlowColumn flexNoGap alignitemsstart">
@@ -68,7 +84,11 @@ <h3><strong data-i18n="">Set Parameters</strong>
                 </label>
                 <label class="checkbox flex-container">
                     <input type="checkbox" name="eight_bit_cache" />
-                    <span data-i18n="Disable FA2">8-bit Cache</span>
+                    <span data-i18n="8-bit Cache">8-bit Cache</span>
+                </label>
+                <label class="checkbox flex-container">
+                    <input type="checkbox" name="use_cfg" />
+                    <span data-i18n="Use CFG">Use CFG</span>
                 </label>
             </div>
         </div>

From 051b4b60aa3d64c352b3ab308700dd8a12d9546f Mon Sep 17 00:00:00 2001
From: RossAscends <124905043+RossAscends@users.noreply.github.com>
Date: Wed, 3 Jan 2024 17:40:51 +0900
Subject: [PATCH 4/5] don't count lora input for loop times..

---
 index.js | 1 -
 1 file changed, 1 deletion(-)

diff --git a/index.js b/index.js
index 3dfe14e..4ec4fba 100644
--- a/index.js
+++ b/index.js
@@ -221,7 +221,6 @@ async function onLoadModelClick() {
             let times = 1;
 
             if (draftModelValue) { times++; }
-            if (loraModelValue) { times++; }
 
             console.debug(`TabbyLoader: need to loop ${times} times`);
 

From 7aa8789ffe179d05e49d317079579ec5c2c09653 Mon Sep 17 00:00:00 2001
From: RossAscends <124905043+RossAscends@users.noreply.github.com>
Date: Wed, 3 Jan 2024 18:01:29 +0900
Subject: [PATCH 5/5] fix lora scaling var save/load, gracefully handle empty
 GPU split

---
 index.js | 32 +++++++++++++++++---------------
 1 file changed, 17 insertions(+), 15 deletions(-)

diff --git a/index.js b/index.js
index 4ec4fba..73b4dcc 100644
--- a/index.js
+++ b/index.js
@@ -18,6 +18,7 @@ let models = [];
 let draftModels = [];
 let loraModels = [];
 let loraReqBody = {};
+let loraAPICallParams;
 let shouldLoadLora = false;
 
 
@@ -280,11 +281,10 @@ async function loadLora() {
         toastr.error("TabbyLoader: Admin key not found. Please provide one in SillyTavern's model settings or in the extension box.");
         return;
     }
-
     loraReqBody.loras = [
         {
             name: loraModelValue,
-            scaling: extensionSettings?.loraAPICallParams?.lora.scaling,
+            scaling: extensionSettings?.loraParams?.loras.scaling,
         },
     ];
 
@@ -380,7 +380,7 @@ async function onParameterEditorClick() {
         .val(extensionSettings?.modelParams?.draft?.draft_ropeAlpha ?? 1.0);
     parameterHtml
         .find('input[name="lora_scale"]')
-        .val(extensionSettings?.modelParams?.lora?.scaling ?? 1.0);
+        .val(extensionSettings?.loraParams?.loras.scaling ?? 1.0);
     parameterHtml
         .find('input[name="no_flash_attention"]')
         .prop('checked', extensionSettings?.modelParams?.noFlashAttention ?? false);
@@ -422,8 +422,8 @@ async function onParameterEditorClick() {
             eightBitCache: parameterHtml.find('input[name="eight_bit_cache"]').prop('checked'),
             useCfg: parameterHtml.find('input[name="use_cfg"]').prop('checked'),
         };
-
-        const loraAPICallParams = {
+        console.debug(`TabbyLoader: lora scale input is ${parameterHtml.find('input[name="lora_scale"]').val()}`);
+        loraAPICallParams = {
             loras: {
                 name: parameterHtml.find('input[name="lora_model_list"]').val(),
                 scaling: parameterHtml.find('input[name="lora_scale"]').val(),
@@ -433,20 +433,22 @@ async function onParameterEditorClick() {
         // Handle GPU split setting
         const gpuSplitVal = parameterHtml.find('input[name="gpu_split_value"]').val();
         try {
-            const gpuSplitArray = JSON.parse(gpuSplitVal) ?? [];
-            if (Array.isArray(gpuSplitArray)) {
-                newParams['gpuSplit'] = gpuSplitArray;
-            } else {
-                console.error(`Provided GPU split value (${gpuSplitArray}) is not an array.`);
-                newParams['gpuSplit'] = [];
+            if (gpuSplitVal) {
+                const gpuSplitArray = JSON.parse(gpuSplitVal) ?? [];
+                if (Array.isArray(gpuSplitArray)) {
+                    newParams['gpuSplit'] = gpuSplitArray;
+                } else {
+                    console.error(`Provided GPU split value (${gpuSplitArray}) is not an array.`);
+                    newParams['gpuSplit'] = [];
+                }
             }
-        } catch (error) {
+            Object.assign(extensionSettings, { modelParams: newParams, loraParams: loraAPICallParams });
+            saveSettingsDebounced();
+        }
+        catch (error) {
             console.error(error);
             newParams['gpuSplit'] = [];
         }
-
-        Object.assign(extensionSettings, { modelParams: newParams, loraParams: loraAPICallParams });
-        saveSettingsDebounced();
     }
 }