Spaces:

lmz
/

candle-llama2

Running

radames committed on Sep 6, 2023

Commit

669c701

1 Parent(s): 1f57ad2

force cache with cache API and fix max seq (#2)

- force cache with cache API and fix max seq (c2a511e0225b51fa9cb3c772501b002126ece76a)

Co-authored-by: Radamés Ajna <radames@users.noreply.huggingface.co>

Files changed (2) hide show

index.html CHANGED Viewed

@@ -38,11 +38,11 @@
         },
         stories42M: {
           url: "stories42M.bin",
-          seq_len: 256,
         },
         stories110M: {
           url: "stories110M.bin",
-          seq_len: 256,
         },
       };
@@ -124,9 +124,17 @@
       const prompt = document.querySelector("#prompt");
       const clearBtn = document.querySelector("#clear-btn");
       const runBtn = document.querySelector("#run");
       let runController = new AbortController();
       let isRunning = false;
       form.addEventListener("submit", async (e) => {
         e.preventDefault();
         if (isRunning) {

         },
         stories42M: {
           url: "stories42M.bin",
+          seq_len: 1024,
         },
         stories110M: {
           url: "stories110M.bin",
+          seq_len: 1024,
         },
       };
       const prompt = document.querySelector("#prompt");
       const clearBtn = document.querySelector("#clear-btn");
       const runBtn = document.querySelector("#run");
+      const modelSelect = document.querySelector("#model");
       let runController = new AbortController();
       let isRunning = false;
+      modelSelect.addEventListener("change", (e) => {
+        const model = MODELS[e.target.value];
+        document.querySelector("#max-seq").max = model.seq_len;
+        document.querySelector("#max-seq").nextElementSibling.value =
+          model.seq_len;
+      });
       form.addEventListener("submit", async (e) => {
         e.preventDefault();
         if (isRunning) {

llama2cWorker.js CHANGED Viewed

@@ -1,13 +1,17 @@
 import init, { Model } from "./build/m.js";
 async function fetchArrayBuffer(url) {
-  const res = await fetch(url, {
-    cache: "force-cache",
-  });
-  const data = await res.arrayBuffer();
-  return new Uint8Array(data);
 }
 class Llama2C {
   static instance = {};

 import init, { Model } from "./build/m.js";
 /**
  * Stores `response` under `url` in `cache`, treating failure as non-fatal.
  *
  * The cache is only an optimisation: a rejected write (for example when the
  * storage quota is exceeded) is logged and otherwise ignored so that the
  * download itself still succeeds.
  *
  * @param {Cache} cache - An opened Cache Storage cache.
  * @param {string} url - Key to store the response under.
  * @param {Response} response - Unread response (normally a clone) to store.
  * @returns {Promise<void>} Settles once the write has finished or failed.
  */
 async function cacheResponseBestEffort(cache, url, response) {
   try {
     await cache.put(url, response);
   } catch (err) {
     console.warn(`Could not cache ${url}`, err);
   }
 }

 /**
  * Downloads `url` and returns its body as bytes, using the Cache Storage API
  * ("llama2c-candle-cache") so repeated loads do not hit the network again.
  *
  * @param {string} url - Location of the resource to load.
  * @returns {Promise<Uint8Array>} The raw bytes of the response body.
  * @throws {Error} If the server answers with a non-2xx status.
  */
 async function fetchArrayBuffer(url) {
   const cacheName = "llama2c-candle-cache";
   // Cache Storage is not exposed everywhere (e.g. non-secure contexts), so
   // fall back to a plain fetch instead of throwing a ReferenceError.
   const cache =
     typeof caches === "undefined" ? null : await caches.open(cacheName);

   const cachedResponse = await cache?.match(url);
   if (cachedResponse) {
     return new Uint8Array(await cachedResponse.arrayBuffer());
   }

   const res = await fetch(url, { cache: "force-cache" });
   if (!res.ok) {
     // Never store or return an error page as if it were the requested file.
     throw new Error(`Failed to fetch ${url}: ${res.status} ${res.statusText}`);
   }

   // Clone before reading: a Response body can only be consumed once.
   const cacheWrite = cache
     ? cacheResponseBestEffort(cache, url, res.clone())
     : Promise.resolve();
   const [buffer] = await Promise.all([res.arrayBuffer(), cacheWrite]);
   return new Uint8Array(buffer);
 }
 class Llama2C {
   static instance = {};