Taylor committed on
Commit
8f4ed48
·
1 Parent(s): ec694f7

perf: cannon-rotated WASM SIMD kernels (14KB→22KB)

Browse files

Updated simd-kernels-standalone.wasm with cannon-rotated
attention + FFN fast kernels from Aether.

Files changed (2) hide show
  1. aether-server.mjs +3 -3
  2. simd-kernels.wasm +2 -2
aether-server.mjs CHANGED
@@ -373,14 +373,14 @@ const server = createServer((req, res) => {
373
  });
374
 
375
  // ─── Main ───────────────────────────────────────────────────────────────────
376
- const ggufPath = '/tmp/hf_cache/buleyean-smollm2-360m-q8_0.gguf';
377
  const tokPath = '/tmp/hf_cache/tokenizer.json';
378
 
379
  async function main() {
380
  simd = await loadSIMD();
381
  if (!existsSync(ggufPath)) {
382
- console.log('[Aether] Downloading Q8_0 GGUF...');
383
- execSync(`python3 -c "from huggingface_hub import hf_hub_download; hf_hub_download('forkjoin-ai/buleyean-smollm2-360m', 'buleyean-smollm2-360m-q8_0.gguf', cache_dir='/tmp/hf_cache', local_dir='/tmp/hf_cache')"`, { stdio: 'inherit' });
384
  }
385
  if (!existsSync(tokPath)) {
386
  console.log('[Aether] Downloading tokenizer...');
 
373
  });
374
 
375
  // ─── Main ───────────────────────────────────────────────────────────────────
376
+ const ggufPath = '/tmp/hf_cache/smollm2-360m-q8_0.gguf';
377
  const tokPath = '/tmp/hf_cache/tokenizer.json';
378
 
379
  async function main() {
380
  simd = await loadSIMD();
381
  if (!existsSync(ggufPath)) {
382
+ console.log('[Aether] Downloading base SmolLM2-360M Q8_0...');
383
+ execSync(`python3 -c "from huggingface_hub import hf_hub_download; hf_hub_download('bartowski/SmolLM2-360M-Instruct-GGUF', 'SmolLM2-360M-Instruct-Q8_0.gguf', cache_dir='/tmp/hf_cache', local_dir='/tmp/hf_cache'); import shutil; shutil.move('/tmp/hf_cache/SmolLM2-360M-Instruct-Q8_0.gguf', '${ggufPath}')"`, { stdio: 'inherit' });
384
  }
385
  if (!existsSync(tokPath)) {
386
  console.log('[Aether] Downloading tokenizer...');
simd-kernels.wasm CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a05084c8998119797c6e80927678ce007e3285b78c6e7e8feee223ca4bb13636
3
- size 14553
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8042fe0e017a1b693fdf548c21b59a4312d615b743738a6c74bf00e570c1ae97
3
+ size 22087