Everything is working
dakenf committed Jul 17, 2023
1 parent ac87020 commit 13cf369
Showing 5 changed files with 36 additions and 7 deletions.
2 changes: 1 addition & 1 deletion ort-wasm-handler.js
@@ -2,7 +2,7 @@
 const fs = require("fs");
 const path = require("path");
 
 // copy onnxruntime-web WebAssembly files to public/ folder
-const srcFolder = path.join(__dirname, "node_modules", "onnxruntime-web", "dist");
+const srcFolder = path.join(__dirname, "node_modules", "@aislamov/onnxruntime-web64", "dist");
 const destFolder = path.join(__dirname, "public", "static", "js");
 
 if (fs.existsSync('./node_modules/.cache')) {
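Only the top of ort-wasm-handler.js is shown above. A hedged sketch of what the remainder of such a copy script typically does, assuming it clears the bundler cache and copies the .wasm binaries into the public folder — the rm/copy logic here is illustrative, not the commit's exact code:

// Hypothetical continuation of ort-wasm-handler.js -- an assumption,
// not the commit's code. Mirrors the file's CommonJS style.
const fs = require("fs");
const path = require("path");

const srcFolder = path.join(__dirname, "node_modules", "@aislamov/onnxruntime-web64", "dist");
const destFolder = path.join(__dirname, "public", "static", "js");

// A stale build cache could keep the old 32-bit binaries in the bundle,
// so drop it before copying the swapped-in package's artifacts.
if (fs.existsSync("./node_modules/.cache")) {
  fs.rmSync("./node_modules/.cache", { recursive: true, force: true });
}

// Copy only the WebAssembly binaries into the served static folder.
fs.mkdirSync(destFolder, { recursive: true });
for (const file of fs.readdirSync(srcFolder)) {
  if (file.endsWith(".wasm")) {
    fs.copyFileSync(path.join(srcFolder, file), path.join(destFolder, file));
  }
}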
27 changes: 27 additions & 0 deletions package-lock.json

Some generated files are not rendered by default.

1 change: 1 addition & 0 deletions package.json
@@ -15,6 +15,7 @@
     "@types/react": "^18.2.8",
     "@types/react-dom": "^18.2.4",
     "@xenova/transformers": "^2.4.1",
+    "@aislamov/onnxruntime-web64": "^0.0.3",
     "http-proxy-middleware": "^2.0.6",
     "lodash": "^4.17.21",
     "onnxruntime-web": "^1.15.1",
11 changes: 6 additions & 5 deletions src/App.tsx
@@ -59,11 +59,13 @@ function FAQ () {
         <ListItem>
           <h2>FAQ</h2>
         </ListItem>
+        <FaqItem question={'What if I get a "protobuf parsing failed" error?'} answer={'Open DevTools, go to Application -> Storage and press "Clear site data".'} />
+        <FaqItem question={'What if I get sbox_fatal_memory_exceeded?'} answer={"You don't have enough RAM to run SD. You can try reloading the tab or browser."} />
         <FaqItem question={'How did you make it possible?'} answer={'In order to run it, I had to port StableDiffusionPipeline from Python to JS, then patch onnxruntime and emscripten+binaryen (the WebAssembly compiler toolchain) to support allocating and using >4GB of memory. Once my pull requests make it into a release, anyone will be able to compile and run code that uses >4GB in the browser.'} />
         <FaqItem question={'Why is it so slow?'} answer={'It does not support multi-threading yet, so it uses just one CPU core. There is no way to create 64-bit memory with a SharedArrayBuffer through the WebAssembly.Memory constructor. I’ve proposed a spec change to add a “memory64” flag, and once it’s accepted, I will patch the V8 engine to support it.'} />
         <FaqItem question={'But it’s running on a GPU, right?'} answer={'Yes, but WebGPU support in onnxruntime is at an early stage, so a lot of operations are not implemented yet, and data is constantly transferred to and from the CPU through JS. Once the majority of operations have their JS kernels, it will be much faster.'} />
         <FaqItem question={'Can I run it locally?'} answer={'Yes, this page’s code is available here: '} />
-        <FaqItem question={'Can I use your patched onnxruntime to run big LLMs with transformers.js?'} answer={'Yes, you can use this package, but I don’t guarantee it will work in all cases. This build is limited to 8GB of memory, so you can load up to ~4GB of weights.'} />
+        <FaqItem question={'Can I use your patched onnxruntime to run big LLMs with transformers.js?'} answer={'Yes, you can use this package, but I don’t guarantee it will work in all cases. This build is limited to 8GB of memory, so you can load up to ~4GB of weights. Just use https://www.npmjs.com/package/@aislamov/onnxruntime-web64'} />
         <FaqItem question={'Are you going to make a pull request in the onnxruntime repo?'} answer={'Yes. It will be my second one; I added GPU acceleration to the Node.js binding earlier.'} />
       </List>
     </Box>
@@ -84,17 +86,16 @@ function App() {
   }, [])
 
   const progressCallback = async (info: ProgressCallbackPayload) => {
-    if (info.step) {
-      setStatus(info.step)
-    }
     if (info.images) {
       const canvas = document.getElementById('canvas') as HTMLCanvasElement
       if (canvas) {
         const data = await info.images[0].toImageData({ tensorLayout: 'NCWH', format: 'RGB' });
-        console.log(data)
         canvas.getContext('2d')!.putImageData(data, 0, 0);
       }
     }
+    if (info.step) {
+      setStatus(info.step)
+    }
   }
   const loadModel = () => {
     if (!window.confirm('This will download approximately 3.5GB and use 8GB of your RAM. Are you sure you want to continue?')) {
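For context on the memory answer in the FAQ above: the standard WebAssembly.Memory constructor counts 64KiB pages against a 32-bit address space, so even a shared memory tops out at 4GiB, and there is no flag yet to request 64-bit indexing. A minimal sketch of the current API, with illustrative sizes:

// Standard (wasm32) API: sizes are in 64KiB pages, and the 32-bit
// address space caps a memory at 65536 pages = 4GiB.
const FOUR_GIB_IN_PAGES = 65536;
const memory = new WebAssembly.Memory({
  initial: 256,                // 256 pages = 16MiB up front
  maximum: FOUR_GIB_IN_PAGES,  // the hard wasm32 ceiling
  shared: true,                // backed by a SharedArrayBuffer, for threads
});
console.log(memory.buffer.byteLength); // 16777216 (256 * 65536)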
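The reordering in progressCallback above draws the intermediate image before updating the status text. A self-contained sketch of that canvas path, assuming the fork keeps onnxruntime-web's Tensor.toImageData() shape (the layout/format options simply mirror the call in the diff):

import { Tensor } from '@aislamov/onnxruntime-web64';

// Draw an intermediate image tensor onto a canvas, as progressCallback does.
async function drawTensor(tensor: Tensor, canvas: HTMLCanvasElement): Promise<void> {
  // Convert the tensor to browser ImageData; awaiting is safe whether the
  // implementation is sync or async.
  const imageData = await tensor.toImageData({ tensorLayout: 'NCWH', format: 'RGB' });
  const ctx = canvas.getContext('2d');
  if (ctx) {
    ctx.putImageData(imageData, 0, 0);
  }
}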
2 changes: 1 addition & 1 deletion src/lib/StableDiffusionPipeline.ts
@@ -1,4 +1,4 @@
-import { InferenceSession } from 'onnxruntime-web';
+import { InferenceSession } from '@aislamov/onnxruntime-web64';
 import { PNDMScheduler, SchedulerConfig } from './schedulers/PNDMScheduler'
 // @ts-ignore
 import { getModelFile, getModelJSON } from '@xenova/transformers/src/utils/hub'
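The import swap works because the fork is intended as a drop-in replacement for onnxruntime-web, so the rest of the pipeline code stays untouched. A sketch of session creation under that assumption; the model path and function name are illustrative:

import { InferenceSession } from '@aislamov/onnxruntime-web64';

// Create a session on the 64-bit WASM build. With >4GB of addressable
// memory, models beyond the usual 32-bit limit can be loaded
// (up to ~4GB of weights / 8GB of memory, per the FAQ above).
async function loadUnet(): Promise<InferenceSession> {
  return InferenceSession.create('/models/unet/model.onnx', {
    executionProviders: ['wasm'],
  });
}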
