fix: A1-14c run embedding model on Apple GPU via EMLX with EXLA-CPU fallback

2026-05-29 16:26:33 +02:00
parent d03d033548
commit 84b91750fb
7 changed files with 112 additions and 12 deletions
--- a/mix.exs
+++ b/mix.exs
@@ -36,6 +36,10 @@ defmodule BDS.MixProject do
      {:image, "~> 0.67"},
      {:nx, "~> 0.10"},
      {:exla, "~> 0.10"},
+      # Apple Silicon GPU (Metal) acceleration for embedding inference. EMLX ships
+      # precompiled MLX binaries; the Neural backend prefers it on arm64 macOS
+      # and falls back to EXLA-CPU elsewhere (SPECGAPS A1-14c).
+      {:emlx, "~> 0.2.0"},
      {:bumblebee, "~> 0.6.3"},
      {:hnswlib, "~> 0.1.7"},
      {:stemex, "~> 0.2.1"},
@@ -64,7 +68,7 @@ defmodule BDS.MixProject do
    env = Mix.env()

    [
-      plt_add_apps: [:mix, :inets, :ssl, :nx, :exla, :bumblebee, :hnswlib],
+      plt_add_apps: [:mix, :inets, :ssl, :nx, :exla, :emlx, :bumblebee, :hnswlib],
      paths: ["_build/#{env}/lib/bds/ebin"]
    ]
  end