
Commit 2d088ea: improve model selector (#107)

1. clear all chat history when switching model
2. ban user input model url temporarily

1 parent e1e2e0a · commit 2d088ea

4 files changed: +25 −24 lines

site/_includes/llm_chat.html

Lines changed: 7 additions & 7 deletions

@@ -22,20 +22,20 @@
     }
   }
 </script>
-<!--
+
 <form>
-  <select id="model-name">
-    <option selected="selected">vicuna-v1-7b-q4f32_0</option>
-    <option >RedPajama-INCITE-Chat-3B-v1-q4f32_0</option>
+  <select id="model">
+    <option >vicuna-v1-7b-q4f32_0</option>
+    <option selected="selected">RedPajama-INCITE-Chat-3B-v1-q4f32_0</option>
   </select>
-</form> -->
+</form>
 
-<label>Pick a pre-compiled model or load your own model's mlc-chat-config.json:
+<!-- <label>Pick a pre-compiled model or load your own model's mlc-chat-config.json:
 <input list="model-names" name="model" id="model"/></label>
 <datalist id="model-names">
   <option value="vicuna-v1-7b-q4f32_0" ></option>
   <option value="RedPajama-INCITE-Chat-3B-v1-q4f32_0"></option>
-</datalist>
+</datalist> -->
 
 <script src="dist/llm_chat.js"></script>
 <link href="dist/llm_chat.css" rel="stylesheet" type="text/css"/>
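
The diff above swaps the free-form model-URL input for a fixed `<select id="model">`, and per the commit message, switching models also clears the chat history. A minimal sketch of that switch policy — the function and field names here are hypothetical, not from this codebase:

```javascript
// Hypothetical sketch of the policy in the commit message: changing the
// model discards the whole conversation, since two models may use
// different prompt formats and tokenizers.
function switchModel(state, newModel) {
  if (state.model === newModel) {
    return state; // same model re-selected: keep history
  }
  return { model: newModel, history: [] }; // new model: start fresh
}

const before = {
  model: "vicuna-v1-7b-q4f32_0",
  history: ["Hello!", "Hi, how can I help?"],
};
const after = switchModel(before, "RedPajama-INCITE-Chat-3B-v1-q4f32_0");
console.log(after.history.length); // prints 0
```

In the real page, a `change` listener on the select would invoke logic like this and then reload the model pipeline.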

site/index.md

Lines changed: 9 additions & 9 deletions

@@ -22,22 +22,22 @@ Won’t it be even more amazing if we can simply open up a browser and directly
 
 ## Instructions
 
-WebGPU just shipped to Chrome and is in beta. We do our experiments in [Chrome Canary](https://www.google.com/chrome/canary/). You can also try out the latest Chrome 113. Chrome version ≤ 112 is not supported, and if you are using it, the demo will raise an error like `Find an error initializing the WebGPU device OperationError: Required limit (1073741824) is greater than the supported limit (268435456). - While validating maxBufferSize - While validating required limits.`
-We have tested it on windows and mac, you will need a gpu with about 6.4G memory.
+WebGPU just shipped to Chrome. You can try out the latest Chrome 113. Chrome version ≤ 112 is not supported, and if you are using it, the demo will raise an error like `Find an error initializing the WebGPU device OperationError: Required limit (1073741824) is greater than the supported limit (268435456). - While validating maxBufferSize - While validating required limits.`
+We have tested it on Windows and Mac, you will need a GPU with about 6GB memory to run Vicuna-7B and about 3GB memory to run RedPajama-3B.
 
 If you have a Mac computer with Apple silicon, here are the instructions for you to run the chatbot demo on your browser locally:
 
-- Install [Chrome Canary](https://www.google.com/chrome/canary/), a developer version of Chrome that enables the use of WebGPU.
-- Launch Chrome Canary. You are recommended to launch from terminal with the following command (or replace Chrome Canary with Chrome):
+- Upgrade Chrome to version ≥ 113.
+- Launch Chrome. You are recommended to launch from terminal with the following command:
 ```
-/Applications/Google\ Chrome\ Canary.app/Contents/MacOS/Google\ Chrome\ Canary --enable-dawn-features=disable_robustness
+/Applications/Google\ Chrome.app/Contents/MacOS/Google\ Chrome --enable-dawn-features=disable_robustness
 ```
-This command turns off the robustness check from Chrome Canary that slows down chatbot reply to times. It is not necessary, but we strongly recommend you to start Chrome with this command.
-- Enter your inputs, click “Send” – we are ready to go! The chat bot will first fetch model parameters into local cache. The download may take a few minutes, only for the first run. The subsequent refreshes and runs will be faster.
+This command turns off the robustness check from Chrome that slows down chatbot reply to times. It is not necessary, but we strongly recommend you to start Chrome with this command.
+- Select the model you want to try out. Enter your inputs, click “Send” – we are ready to go! The chat bot will first fetch model parameters into local cache. The download may take a few minutes, only for the first run. The subsequent refreshes and runs will be faster.
 
 ## Chat Demo
 
-The chat demo is based on [vicuna-7b-v1.1](https://huggingface.co/lmsys/vicuna-7b-delta-v1.1) model and [RedPajama-INCITE-Chat-3B-v1](https://huggingface.co/togethercomputer/RedPajama-INCITE-Chat-3B-v1) model . More model support are on the way.
+The chat demo is based on [vicuna-7b-v1.1](https://huggingface.co/lmsys/vicuna-7b-delta-v1.1) model and [RedPajama-INCITE-Chat-3B-v1](https://huggingface.co/togethercomputer/RedPajama-INCITE-Chat-3B-v1) model. More model supports are on the way.
 
 {% include llm_chat.html %}
 
@@ -48,4 +48,4 @@ The chat demo is based on [vicuna-7b-v1.1](https://huggingface.co/lmsys/vicuna-7
 
 ## Disclaimer
 
-This demo site is for research purposes only, subject to the model License of LLaMA and Vicuna. Please contact us if you find any potential violation.
+This demo site is for research purposes only, subject to the model License of LLaMA, Vicuna and RedPajama. Please contact us if you find any potential violation.
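
The error quoted in the instructions above comes from the demo requesting a `maxBufferSize` of 1073741824 bytes (1 GiB), which Chrome ≤ 112 does not grant. As a hedged illustration — not code from this repo — a page could check the adapter's limits up front instead of failing mid-initialization; the helper is written as a pure function so it can be fed a plain object as well as real `adapter.limits`:

```javascript
// Illustrative check (not from this repo): does the adapter grant the
// 1073741824-byte (1 GiB) maxBufferSize the demo's error message mentions?
function hasEnoughBuffer(limits, needed = 1073741824) {
  return limits.maxBufferSize >= needed;
}

// In a WebGPU-capable browser, the limits would come from the adapter:
//   const adapter = await navigator.gpu.requestAdapter();
//   hasEnoughBuffer(adapter.limits);
console.log(hasEnoughBuffer({ maxBufferSize: 268435456 })); // prints false
```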

web/llm_chat.html

Lines changed: 7 additions & 7 deletions

@@ -22,20 +22,20 @@
     }
   }
 </script>
-<!--
+
 <form>
-  <select id="model-name">
-    <option selected="selected">vicuna-v1-7b-q4f32_0</option>
-    <option >RedPajama-INCITE-Chat-3B-v1-q4f32_0</option>
+  <select id="model">
+    <option >vicuna-v1-7b-q4f32_0</option>
+    <option selected="selected">RedPajama-INCITE-Chat-3B-v1-q4f32_0</option>
   </select>
-</form> -->
+</form>
 
-<label>Pick a pre-compiled model or load your own model's mlc-chat-config.json:
+<!-- <label>Pick a pre-compiled model or load your own model's mlc-chat-config.json:
 <input list="model-names" name="model" id="model"/></label>
 <datalist id="model-names">
   <option value="vicuna-v1-7b-q4f32_0" ></option>
   <option value="RedPajama-INCITE-Chat-3B-v1-q4f32_0"></option>
-</datalist>
+</datalist> -->
 
 <script src="dist/llm_chat.js"></script>
 <link href="dist/llm_chat.css" rel="stylesheet" type="text/css"/>

web/llm_chat.js

Lines changed: 2 additions & 1 deletion

@@ -494,11 +494,12 @@ class LLMChatInstance {
     this.uiChatInput = undefined;
     this.logger = console.log;
     this.debugTest = false;
-    this.model = "vicuna-v1-7b-q4f32_0";
+    this.model = "RedPajama-INCITE-Chat-3B-v1-q4f32_0";
 
   }
 
   reboot() {
+    this.resetChat();
     this.config = undefined;
     this.pipeline = undefined;
     if (this.tvm !== undefined) {
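
The one-line addition above makes `reboot()` clear the conversation before tearing down the pipeline. A simplified sketch of that interplay — fields and method bodies are trimmed stand-ins, not the real `LLMChatInstance`:

```javascript
// Simplified model of the reboot()/resetChat() interplay in this commit;
// this is an illustrative sketch, not the real web/llm_chat.js.
class ChatInstanceSketch {
  constructor() {
    this.model = "RedPajama-INCITE-Chat-3B-v1-q4f32_0"; // new default model
    this.messages = [];
    this.config = undefined;
    this.pipeline = undefined;
  }
  resetChat() {
    this.messages = []; // drop the in-memory conversation (and UI, in the real app)
  }
  reboot() {
    this.resetChat(); // the line this commit adds: no stale history survives
    this.config = undefined;   // force config reload for the new model
    this.pipeline = undefined; // force pipeline rebuild
  }
}

const chat = new ChatInstanceSketch();
chat.messages.push("old message");
chat.reboot();
console.log(chat.messages.length); // prints 0
```

Without the `resetChat()` call, a model switch would rebuild the pipeline but leave the previous model's conversation on screen, which is exactly what the commit message fixes.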
