Gunnar Beck Nelson committed on
Commit
9019349
·
unverified ·
1 Parent(s): b39b328

Selora AI v0.4.7

Browse files
manifest.json CHANGED
@@ -1,50 +1,54 @@
1
  {
2
  "name": "selora-ai-local",
3
  "version": "0.4.7",
4
- "description": "Selora AI v0.4.7 \u2014 built on top of [Qwen/Qwen3-1.7B](https://huggingface.co/Qwen/Qwen3-1.7B) (Apache-2.0). F16 base + 4 LoRA specialists with slim action-then-confirm output schemas (command, automation, answer, clarification). Trained with [mlx-lm](https://github.com/ml-explore/mlx-examples) on Apple Silicon. Inference: cache_prompt enabled to amortize system-prompt KV cache across requests.",
5
  "base_model": {
6
  "id": "Qwen/Qwen3-1.7B",
7
  "format": "gguf",
8
- "dtype": "F16",
9
- "filename": "qwen3_17b_base.f16.gguf",
10
- "size_bytes": 4069678880,
11
- "sha256": "3e4009f0d96955a45f29aa77bded839d376d7832823c6909f76c84ace81dc445"
12
  },
13
  "loras": [
14
  {
15
  "slot": 0,
16
  "name": "command",
 
17
  "filename": "selora-v047-command.f16.gguf",
18
  "size_bytes": 19938528,
19
- "sha256": "b10b5131157698400ee9fafac08ab4101b81230a79ad067eb8f89bd4e29a6273"
20
  },
21
  {
22
  "slot": 1,
23
  "name": "automation",
 
24
  "filename": "selora-v047-automation.f16.gguf",
25
- "size_bytes": 37374880,
26
- "sha256": "1bdd8c54cb36332889498a67046f01b55de7e5ac019e350419ba98a9c104f78f"
27
  },
28
  {
29
  "slot": 2,
30
  "name": "answer",
 
31
  "filename": "selora-v047-answer.f16.gguf",
32
  "size_bytes": 14957792,
33
- "sha256": "9ec14105e7119675a75c1e166c132298886f4a25e57628c4ef720fce2080171e"
34
  },
35
  {
36
  "slot": 3,
37
  "name": "clarification",
 
38
  "filename": "selora-v047-clarification.f16.gguf",
39
  "size_bytes": 9977056,
40
- "sha256": "071558279b1bc8c8609fc63a1524604aa7fcf721c5bd6d3ecdf1f55ad16f5e1a"
41
  }
42
  ],
43
  "system_prompts": {
44
  "command": {
45
  "filename": "command_system_prompt.txt",
46
- "size_bytes": 1071,
47
- "sha256": "9921c6fef09c6ebad4a2ed4fad1dbe7e76efe0bfe4e532bf7c7fe096864de6a4"
48
  },
49
  "automation": {
50
  "filename": "automation_system_prompt.txt",
@@ -64,12 +68,29 @@
64
  },
65
  "runtime": {
66
  "cache_prompt": true,
67
- "ctx_size": 4096
68
  },
69
  "training": {
70
  "framework": "mlx-lm",
71
  "base_model_repo": "Qwen/Qwen3-1.7B",
72
- "english_only": true,
73
- "workspace_version": "0.4.7"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
74
  }
75
  }
 
1
  {
2
  "name": "selora-ai-local",
3
  "version": "0.4.7",
4
+ "description": "Selora AI v0.4.7 \u2014 Qwen3-1.7B Q6_K base + 4 LoRA specialists. Hub-optimal base quant (fits Vega 8 VRAM, no GTT spill). Specialists retrained on a compacted-JSON corpus (automation rank 32); command specialist prompt updated, other three unchanged from v0.4.6.",
5
  "base_model": {
6
  "id": "Qwen/Qwen3-1.7B",
7
  "format": "gguf",
8
+ "dtype": "Q6_K",
9
+ "filename": "qwen3_17b_base.Q6_K.gguf",
10
+ "size_bytes": 1673006880,
11
+ "sha256": "a00bbdb411872149d73e1a0683b9b8a9f13cf74f98ba70ff8e8e430d9a093179"
12
  },
13
  "loras": [
14
  {
15
  "slot": 0,
16
  "name": "command",
17
+ "rank": 16,
18
  "filename": "selora-v047-command.f16.gguf",
19
  "size_bytes": 19938528,
20
+ "sha256": "49ba46bc054259409f5cd52eb3d9971101ed858fba27c6678c89e145815af515"
21
  },
22
  {
23
  "slot": 1,
24
  "name": "automation",
25
+ "rank": 32,
26
  "filename": "selora-v047-automation.f16.gguf",
27
+ "size_bytes": 59791968,
28
+ "sha256": "32e5633f0e554fec5e336d993647065f85a4fffd348366cdc3417ca34824b527"
29
  },
30
  {
31
  "slot": 2,
32
  "name": "answer",
33
+ "rank": 12,
34
  "filename": "selora-v047-answer.f16.gguf",
35
  "size_bytes": 14957792,
36
+ "sha256": "7584a04e13dd3e4973bfeb89ed01b7b29b3288d768d7bee15bcea3de89ff50c7"
37
  },
38
  {
39
  "slot": 3,
40
  "name": "clarification",
41
+ "rank": 8,
42
  "filename": "selora-v047-clarification.f16.gguf",
43
  "size_bytes": 9977056,
44
+ "sha256": "75c06c0efbd9ca1e7108ec6ec5811f68e2dc5639d01ef583148a151b11398847"
45
  }
46
  ],
47
  "system_prompts": {
48
  "command": {
49
  "filename": "command_system_prompt.txt",
50
+ "size_bytes": 1374,
51
+ "sha256": "0fa2b1669dedca18ddba2cebd7f72cd7cff0f7431b87ca4166a4bf60c7aed697"
52
  },
53
  "automation": {
54
  "filename": "automation_system_prompt.txt",
 
68
  },
69
  "runtime": {
70
  "cache_prompt": true,
71
+ "ctx_size": 8192
72
  },
73
  "training": {
74
  "framework": "mlx-lm",
75
  "base_model_repo": "Qwen/Qwen3-1.7B",
76
+ "scale": 20.0,
77
+ "rank_per_specialist": {
78
+ "command": 16,
79
+ "automation": 32,
80
+ "answer": 12,
81
+ "clarification": 8
82
+ },
83
+ "iterations_per_specialist": {
84
+ "command": 800,
85
+ "automation": 1800,
86
+ "answer": 600,
87
+ "clarification": 450
88
+ },
89
+ "examples_per_specialist": {
90
+ "command": 11000,
91
+ "automation": 10000,
92
+ "answer": 5500,
93
+ "clarification": 3000
94
+ }
95
  }
96
  }
prompts/command_system_prompt.txt CHANGED
@@ -5,11 +5,11 @@ Given a user command and the AVAILABLE ENTITIES list, respond with ONE JSON obje
5
 
6
  Rules:
7
  - c: ordered array of one or more service calls. Calls execute in array order.
8
- - s: HA service in "domain.action" form (e.g. "light.turn_on", "lock.lock", "media_player.play_media", "scene.turn_on").
9
  - e: canonical entity_id from AVAILABLE ENTITIES. Never use the human alias — always the entity_id.
10
  - d: service parameters object. Omit the d key entirely when there are no params (do not include "d":{}).
11
  - r: ≤ 1 sentence past-tense confirmation describing what got done (e.g. "Kitchen light on.").
12
- - The service domain (before the dot) must match the entity_id's domain. light.turn_on goes with light.* entities, lock.lock goes with lock.* entities, etc.
13
  - For multi-target requests, produce one c entry per (service, entity_id) pair.
14
 
15
  Output JSON only — no narration, no markdown fences, no chain-of-thought.
 
5
 
6
  Rules:
7
  - c: ordered array of one or more service calls. Calls execute in array order.
8
+ - s: HA service in "domain.action" form. Only these domains are accepted for immediate execution: light, switch, fan, media_player, climate, input_boolean, scene, cover. Examples: "light.turn_on", "switch.turn_off", "media_player.media_play", "cover.open_cover", "scene.turn_on". Do not emit lock.*, alarm_*, script.*, notify.*, or any other domain — those are blocked by the safety policy and the call will fail.
9
  - e: canonical entity_id from AVAILABLE ENTITIES. Never use the human alias — always the entity_id.
10
  - d: service parameters object. Omit the d key entirely when there are no params (do not include "d":{}).
11
  - r: ≤ 1 sentence past-tense confirmation describing what got done (e.g. "Kitchen light on.").
12
+ - The service domain (before the dot) must match the entity_id's domain. light.turn_on goes with light.* entities, cover.open_cover goes with cover.* entities, etc.
13
  - For multi-target requests, produce one c entry per (service, entity_id) pair.
14
 
15
  Output JSON only — no narration, no markdown fences, no chain-of-thought.
qwen3_17b_base.f16.gguf DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:3e4009f0d96955a45f29aa77bded839d376d7832823c6909f76c84ace81dc445
3
- size 4069678880
 
 
 
 
selora-v047-answer.f16.gguf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9ec14105e7119675a75c1e166c132298886f4a25e57628c4ef720fce2080171e
3
  size 14957792
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7584a04e13dd3e4973bfeb89ed01b7b29b3288d768d7bee15bcea3de89ff50c7
3
  size 14957792
selora-v047-automation.f16.gguf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1bdd8c54cb36332889498a67046f01b55de7e5ac019e350419ba98a9c104f78f
3
- size 37374880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:32e5633f0e554fec5e336d993647065f85a4fffd348366cdc3417ca34824b527
3
+ size 59791968
selora-v047-clarification.f16.gguf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:071558279b1bc8c8609fc63a1524604aa7fcf721c5bd6d3ecdf1f55ad16f5e1a
3
  size 9977056
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:75c06c0efbd9ca1e7108ec6ec5811f68e2dc5639d01ef583148a151b11398847
3
  size 9977056
selora-v047-command.f16.gguf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b10b5131157698400ee9fafac08ab4101b81230a79ad067eb8f89bd4e29a6273
3
  size 19938528
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:49ba46bc054259409f5cd52eb3d9971101ed858fba27c6678c89e145815af515
3
  size 19938528