Kenshiin13
diff --git a/‎.github/workflows/release.yml‎
Lines changed: 10 additions & 61 deletions b/‎.github/workflows/release.yml‎
Lines changed: 10 additions & 61 deletions
diff --git a/‎README.md‎
Lines changed: 13 additions & 14 deletions b/‎README.md‎
Lines changed: 13 additions & 14 deletions
diff --git a/‎electron/electron-builder.config.js‎
Lines changed: 24 additions & 12 deletions b/‎electron/electron-builder.config.js‎
Lines changed: 24 additions & 12 deletions
@@ -12,19 +12,16 @@ on:
   workflow_dispatch:
 
 permissions:
-  contents: write   # required for softprops/action-gh-release to create releases
+  contents: write
 
 jobs:
   # ---------------------------------------------------------------------------
   build-windows:
     name: Build Windows (x64)
     runs-on: windows-latest
     steps:
-      - name: Checkout
-        uses: actions/checkout@v4
-
-      - name: Setup Node.js
-        uses: actions/setup-node@v4
+      - uses: actions/checkout@v4
+      - uses: actions/setup-node@v4
         with:
           node-version: '20'
           cache: 'npm'
@@ -34,10 +31,6 @@ jobs:
         working-directory: electron
         run: npm ci --legacy-peer-deps
 
-      - name: Bundle whisper.cpp binary + base model
-        working-directory: electron
-        run: npm run setup:whisper
-
       - name: Build renderer + main
         working-directory: electron
         run: npm run build
@@ -52,8 +45,7 @@ jobs:
         shell: bash
         run: ls -la dist/electron-release/
 
-      - name: Upload artifact
-        uses: actions/upload-artifact@v4
+      - uses: actions/upload-artifact@v4
         with:
           name: echo-windows-x64
           path: dist/electron-release/*.exe
@@ -63,13 +55,10 @@ jobs:
   # ---------------------------------------------------------------------------
   build-macos-arm64:
     name: Build macOS (Apple Silicon)
-    runs-on: macos-latest      # GitHub's default macOS runner is arm64
+    runs-on: macos-latest
     steps:
-      - name: Checkout
-        uses: actions/checkout@v4
-
-      - name: Setup Node.js
-        uses: actions/setup-node@v4
+      - uses: actions/checkout@v4
+      - uses: actions/setup-node@v4
         with:
           node-version: '20'
           cache: 'npm'
@@ -79,10 +68,6 @@ jobs:
         working-directory: electron
         run: npm ci --legacy-peer-deps
 
-      - name: Bundle whisper.cpp binary + base model
-        working-directory: electron
-        run: npm run setup:whisper
-
       - name: Build renderer + main
         working-directory: electron
         run: npm run build
@@ -96,67 +81,31 @@ jobs:
       - name: Show output
         run: ls -la dist/electron-release/
 
-      - name: Upload artifact
-        uses: actions/upload-artifact@v4
+      - uses: actions/upload-artifact@v4
         with:
           name: echo-macos-arm64
           path: dist/electron-release/*.dmg
           if-no-files-found: error
           retention-days: 14
 
-  # ---------------------------------------------------------------------------
-  # Intel macOS — uncomment to ship an x86_64 build too.
-  # macOS 13 is the last GitHub-hosted Intel runner image.
-  # ---------------------------------------------------------------------------
-  # build-macos-intel:
-  #   name: Build macOS (Intel)
-  #   runs-on: macos-13
-  #   steps:
-  #     - uses: actions/checkout@v4
-  #     - uses: actions/setup-node@v4
-  #       with:
-  #         node-version: '20'
-  #         cache: 'npm'
-  #         cache-dependency-path: electron/package-lock.json
-  #     - run: npm ci --legacy-peer-deps
-  #       working-directory: electron
-  #     - run: npm run build
-  #       working-directory: electron
-  #     - run: npx electron-builder --mac --x64 --publish never
-  #       working-directory: electron
-  #       env:
-  #         GH_TOKEN: ${{ secrets.GITHUB_TOKEN }}
-  #     - uses: actions/upload-artifact@v4
-  #       with:
-  #         name: echo-macos-x64
-  #         path: dist/electron-release/*.dmg
-  #         if-no-files-found: error
-  #         retention-days: 14
-
-  # ---------------------------------------------------------------------------
-  # Collect all artifacts and publish them as a GitHub Release.
-  # Only runs for tag pushes — manual runs leave the artifacts on the run.
   # ---------------------------------------------------------------------------
   release:
     name: Publish GitHub Release
     needs: [build-windows, build-macos-arm64]
     runs-on: ubuntu-latest
     if: startsWith(github.ref, 'refs/tags/')
     steps:
-      - name: Download all artifacts
-        uses: actions/download-artifact@v4
+      - uses: actions/download-artifact@v4
         with:
           path: artifacts
 
       - name: Flatten artifacts
         run: |
           mkdir -p release
           find artifacts -type f -exec mv {} release/ \;
-          echo "--- release contents ---"
           ls -la release/
 
-      - name: Publish release
-        uses: softprops/action-gh-release@v2
+      - uses: softprops/action-gh-release@v2
         with:
           files: release/*
           draft: false
 
@@ -10,7 +10,7 @@
 <p align="center">
   <a href="https://github.com/Kenshiin13/echo/releases"><img src="https://img.shields.io/github/v/release/Kenshiin13/echo?style=flat-square&color=3FA8E0" alt="Release"/></a>
   <img src="https://img.shields.io/badge/platform-Windows%20%7C%20macOS-1f2937?style=flat-square" alt="Platform"/>
-  <img src="https://img.shields.io/badge/whisper.cpp-v1.8.4-A855F7?style=flat-square" alt="whisper.cpp"/>
+  <img src="https://img.shields.io/badge/engine-onnxruntime--node-A855F7?style=flat-square" alt="onnxruntime-node"/>
 </p>
 
 ---
@@ -23,11 +23,10 @@
 
 - **Global push-to-talk** — press a hotkey anywhere (default `F9`), speak, release. Transcript is pasted at your cursor.
 - **Voice activation (optional)** — hands-free mode powered by [Silero VAD](https://github.com/snakers4/silero-vad). Flip it on in Settings and Echo auto-transcribes each utterance as you speak. Ignores non-speech noise.
-- **Fully local transcription** — all audio and transcription stays on-device via [whisper.cpp](https://github.com/ggml-org/whisper.cpp). Your voice never leaves your machine.
-- **Automatic translation (optional)** — point Echo at a target language and it will translate each transcript via [DeepL](https://www.deepl.com/) before pasting. Skipped automatically when you're already speaking the target language. Audio still stays local; only the transcript text is sent.
-- **Low-latency transcription** — Whisper runs as a persistent `whisper-server` process with the model kept resident in memory, so every utterance skips cold-load overhead.
-- **GPU acceleration** — CUDA on Windows (NVIDIA), Metal on Apple Silicon, CPU fallback everywhere.
-- **Five model sizes** — from 75 MB (`tiny`) to 1.6 GB (`large-v3-turbo`). Pick the accuracy/speed tradeoff you want.
+- **Fully local transcription** — Whisper runs in-process via [ONNX Runtime](https://onnxruntime.ai/) + [Transformers.js](https://huggingface.co/docs/transformers.js). Audio never leaves your machine.
+- **Automatic translation (optional)** — point Echo at a target language and it will translate each transcript via [DeepL](https://www.deepl.com/) before pasting. Audio stays local; only the transcript text is sent.
+- **Model kept resident** — loaded once at startup into the main process and reused for every utterance, so there is no cold-load per transcription.
+- **Five model sizes** — from `tiny` to `large-v3-turbo`. Pick the accuracy/speed tradeoff you want.
 - **14 languages + auto-detect** — English, German, French, Spanish, Italian, Portuguese, Dutch, Russian, Chinese, Japanese, Korean, Arabic…
 - **Live audio indicator** — a small overlay shows a waveform while you speak, progress while a model downloads, and a check when paste completes.
 - **Model manager** — download, switch, and delete models from the settings window. New models download with a progress bar on first use.
@@ -40,18 +39,18 @@ Download the latest installer from the [Releases page](https://github.com/Kenshi
 
 | Platform | File |
 |----------|------|
-| Windows 10/11 (x64) | `Echo-Setup-X.Y.Z.exe` |
-| macOS (Apple Silicon) | `Echo-X.Y.Z-arm64.dmg` |
+| Windows 10/11 (x64) | `Echo.Setup.X.Y.Z.exe` |
+| macOS (Apple Silicon — M1/M2/M3/M4) | `Echo-X.Y.Z-arm64.dmg` |
 
 > **macOS note:** the build is unsigned (no paid Apple Developer ID). After dragging **Echo** to Applications, right-click the app → **Open** on first launch to bypass Gatekeeper.
 >
-> If macOS still refuses with *"Echo is damaged and can't be opened"*, it's the quarantine flag from the download. Clear it with:
+> If macOS still refuses with *"Echo is damaged and can't be opened"*, clear the quarantine flag:
 >
 > ```bash
 > xattr -cr /Applications/Echo.app && open /Applications/Echo.app
 > ```
 
-On first launch, Echo will auto-download the selected whisper model (`base` by default, ~142 MB) with a progress indicator. If you have an NVIDIA GPU and select the **CUDA** backend, it will also download the CUDA-enabled binary.
+On first launch, Echo will auto-download the selected Whisper model (`base` by default) into `~/.../Echo/whisper-models` with a progress indicator.
 
 ## Usage
 
@@ -77,8 +76,7 @@ Open settings from the tray icon. Everything is persisted to `electron-store` in
 | Push-to-talk hotkey | `F9` | Any key or modifier combo |
 | Exit shortcut | `Ctrl+Alt+Q` | Global quit |
 | Model size | `base` | `tiny` / `base` / `small` / `medium` / `large-v3-turbo` |
-| Language | Auto-detect | Pick one for better accuracy if auto-detect mis-fires |
-| Compute backend | Auto | `CPU` / `CUDA` / `MLX` — auto-selected based on hardware |
+| Language | Auto-detect | Pin one for slightly faster transcription and to enable the translate-skip optimization |
 | Auto-paste | On | Off = copy to clipboard only |
 | Voice activation | Off | Always-listening mode using Silero VAD (disables the hotkey) |
 | Translate transcription to | Off | Target language for automatic DeepL translation; skipped when you already speak it |
@@ -93,10 +91,11 @@ Requires Node.js 20+.
 git clone https://github.com/Kenshiin13/echo.git
 cd echo/electron
 npm install --legacy-peer-deps
-npm run setup:whisper   # downloads whisper.cpp binary + base model
 npm run dev             # dev mode with hot reload
 ```
 
+On first run, Echo will download the selected Whisper ONNX model from Hugging Face.
+
 Package an installer:
 
 ```bash
@@ -111,7 +110,7 @@ Releases are automated — pushing a `v*` tag (e.g. `v1.2.0`) triggers the [rele
 - **[Electron 33](https://www.electronjs.org/)** — shell
 - **[React 18](https://react.dev/) + [Vite 6](https://vite.dev/)** — renderer (three entries: settings, indicator overlay, audio capture)
 - **[Mantine v7](https://mantine.dev/) + [Tailwind](https://tailwindcss.com/)** — UI
-- **[whisper.cpp](https://github.com/ggml-org/whisper.cpp)** — transcription engine, run as a long-lived `whisper-server` subprocess with the model kept resident in RAM
+- **[@huggingface/transformers](https://huggingface.co/docs/transformers.js)** + **[onnxruntime-node](https://onnxruntime.ai/)** — Whisper ASR runs in-process using ONNX models from [Xenova/whisper-*](https://huggingface.co/Xenova)
 - **[Silero VAD](https://github.com/snakers4/silero-vad)** via [@ricky0123/vad-web](https://github.com/ricky0123/vad) — neural voice activity detection for the voice-activation mode
 - **[DeepL API](https://www.deepl.com/pro-api)** — optional cloud translation layer between Whisper and paste
 - **[koffi](https://koffi.dev/)** — FFI for global key polling on Windows
 
@@ -16,19 +16,32 @@ module.exports = {
     output: "../dist/electron-release",
     buildResources: "build-resources",
   },
+  // Include the built output + runtime deps. electron-builder's default
+  // patterns get replaced when `files` is set explicitly, so we list what
+  // we need. Native .node binaries land where npm puts them under
+  // node_modules/<pkg>/... and stay unpacked via `asarUnpack` below.
   files: [
     "dist/**",
     "!dist/renderer/**/*.map",
-    // uiohook-napi is macOS/Linux only — exclude it from Windows builds
+    "node_modules/**/*",
+    "package.json",
+    // uiohook-napi is macOS/Linux only — skip on Windows builds.
     ...(process.platform === "win32" ? ["!node_modules/uiohook-napi/**"] : []),
+    // Dev-only noise — keep slim but don't over-filter.
+    "!node_modules/**/*.{md,map,ts,tsx}",
+    "!node_modules/**/{test,tests,__tests__,example,examples,docs,.github}/**",
+    "!node_modules/**/{LICENSE,license,LICENCE,licence,CHANGELOG,changelog,README,readme}{,.md,.txt,.markdown}",
   ],
+  // Native modules loaded via require() must sit on the real filesystem,
+  // not inside app.asar. Everything listed here is a standard prebuilt-.node package.
   asarUnpack: [
-    "node_modules/nodejs-whisper/**",
+    "node_modules/onnxruntime-node/**",
     "node_modules/koffi/**",
     "node_modules/@nut-tree-fork/**",
+    "node_modules/uiohook-napi/**",
   ],
-  // koffi ships pre-built Electron binaries — no native compilation needed.
-  // uiohook-napi requires MSVC and is not used on Windows; skip it via beforeBuild.
+  // Native modules need an Electron ABI rebuild on macOS/Linux. Windows
+  // ships prebuilts for all of them; skip rebuild to save a CI step.
   npmRebuild: process.platform !== "win32",
   beforeBuild: async (context) => {
     if (context.platform.name === "windows") {
@@ -38,6 +51,9 @@ module.exports = {
       if (fs.existsSync(p)) fs.rmSync(p, { recursive: true, force: true });
     }
   },
+  // Ad-hoc signs the macOS .app (no paid Apple Developer ID).
+  // No-op on Windows/Linux.
+  afterPack: "./scripts/mac-afterpack.js",
   extraResources: [
     {
       from: "../assets",
@@ -65,17 +81,13 @@ module.exports = {
   mac: {
     icon: "../assets/echo_macos_app_icon.icns",
     category: "public.app-category.productivity",
+    // Apple Silicon only (M1/M2/M3/M4). Intel Macs are not supported.
     target: [
       { target: "dmg", arch: ["arm64"] },
-      { target: "dmg", arch: ["x64"] },
     ],
-    // We don't have an Apple Developer ID, so we ship unsigned.
-    // `hardenedRuntime: true` with a missing/invalid signature makes Gatekeeper
-    // report the app as "damaged" with no right-click bypass — worse UX than
-    // shipping plain unsigned. `identity: null` tells electron-builder to skip
-    // signing entirely so Gatekeeper falls back to the normal "unidentified
-    // developer" prompt that users can bypass with right-click → Open (and, in
-    // the worst case, by clearing the quarantine xattr — see README).
+    // No Developer ID signature — we don't have a paid Apple Developer ID.
+    // afterPack does an ad-hoc signing pass so Gatekeeper treats this as
+    // "unidentified developer" rather than "damaged" (right-click → Open to bypass).
     identity: null,
   },
   dmg: {