chore: publish safetensors NexaMat stack artifacts
Browse files- stack_manifest.json +121 -108
stack_manifest.json
CHANGED
|
@@ -1,121 +1,134 @@
|
|
| 1 |
{
|
|
|
|
|
|
|
|
|
|
| 2 |
"components": {
|
| 3 |
-
"controller": {
|
| 4 |
-
"base_model": "Qwen/Qwen3-14B",
|
| 5 |
-
"closeout_report": "docs/projects/Nexa_Mat/results/reports/2026-05-19_multimodal_h200_fft_closeout.md",
|
| 6 |
-
"model_repo": "AethronPhantom/Nexa_Mat2",
|
| 7 |
-
"model_subfolder": "multimodal/controller/nexa_mat_controller_fft_pilot_20260518T234148Z/final_model_merged",
|
| 8 |
-
"name": "nexa_mat_controller_qwen3_14b_fft_pilot",
|
| 9 |
-
"role": "semantic controller for ranking, rejection, evidence routing, and explanation",
|
| 10 |
-
"training_state": "partial_fft_pilot_not_full_dataset"
|
| 11 |
-
},
|
| 12 |
-
"cross_attention_bridge": {
|
| 13 |
-
"module": "nexa_train.materials.cross_attention.GatedCrossAttentionBridge",
|
| 14 |
-
"role": "inject text, encoder, decoder, task, and evidence streams into diffusion/controller memory",
|
| 15 |
-
"status": "implemented_adapter_surface"
|
| 16 |
-
},
|
| 17 |
-
"decoder": {
|
| 18 |
-
"artifact_uri": "wasabi:nexa-mat/models/nexa_mat/diffusion-generation-v1/prod/nexa_mat_diffusion_prod_fp32_b512_phase_sampler_20260512T162654Z/final_checkpoint.pt",
|
| 19 |
-
"closeout_report": "docs/projects/Nexa_Mat/results/reports/2026-05-13_diffusion_prod_225k_closeout.md",
|
| 20 |
-
"generation_mode": "distributional_sampler_best_of_n",
|
| 21 |
-
"name": "nexa_mat_diffusion_generation_v1",
|
| 22 |
-
"role": "constrained best-of-N candidate proposal and structure repair",
|
| 23 |
-
"run_root_uri": "wasabi:nexa-mat/models/nexa_mat/diffusion-generation-v1/prod/nexa_mat_diffusion_prod_fp32_b512_phase_sampler_20260512T162654Z"
|
| 24 |
-
},
|
| 25 |
"encoder": {
|
| 26 |
-
"
|
| 27 |
-
"
|
| 28 |
-
"
|
| 29 |
-
"
|
| 30 |
-
"
|
| 31 |
-
"
|
| 32 |
-
|
| 33 |
-
|
| 34 |
-
|
| 35 |
-
|
| 36 |
-
|
| 37 |
-
"all_fixture": {
|
| 38 |
-
"alignment_gates": 3,
|
| 39 |
-
"alignment_score": 0.4315514275885793,
|
| 40 |
-
"candidate_decision_accuracy": 0.16666666666666666,
|
| 41 |
-
"candidates": 6,
|
| 42 |
-
"controller_alignment_promotable": false,
|
| 43 |
-
"criteria": {
|
| 44 |
-
"alignment_ready_for_fft": true,
|
| 45 |
-
"bad_candidate_false_positive_max": 0.0,
|
| 46 |
-
"min_frontier_preservation": 1.0,
|
| 47 |
-
"min_known_deprioritization": 1.0,
|
| 48 |
-
"uncontained_hallucination_max": 0.0
|
| 49 |
},
|
| 50 |
-
"
|
| 51 |
-
|
| 52 |
-
|
| 53 |
-
"
|
| 54 |
-
"
|
| 55 |
-
"
|
| 56 |
-
"
|
| 57 |
-
"
|
|
|
|
|
|
|
|
|
|
| 58 |
},
|
| 59 |
-
"
|
| 60 |
-
|
| 61 |
-
"
|
| 62 |
-
|
| 63 |
-
|
| 64 |
-
|
| 65 |
-
"report": "/dev/shm/nexa_mat_controller_rollout_all_eval.md",
|
| 66 |
-
"structured_output_validity": 0.16666666666666666,
|
| 67 |
-
"uncontained_hallucination_rate": 1.0
|
| 68 |
-
},
|
| 69 |
-
"artifact_paths": {
|
| 70 |
-
"all_predictions.jsonl": "eval/controller_smoke/all_predictions.jsonl",
|
| 71 |
-
"all_summary.json": "eval/controller_smoke/all_summary.json",
|
| 72 |
-
"reverse_predictions.jsonl": "eval/controller_smoke/reverse_predictions.jsonl",
|
| 73 |
-
"reverse_summary.json": "eval/controller_smoke/reverse_summary.json"
|
| 74 |
},
|
| 75 |
-
"
|
| 76 |
-
|
| 77 |
-
"
|
| 78 |
-
"
|
| 79 |
-
"
|
| 80 |
-
"
|
| 81 |
-
"
|
| 82 |
-
"
|
| 83 |
-
|
| 84 |
-
|
| 85 |
-
"
|
| 86 |
-
"
|
| 87 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 88 |
},
|
| 89 |
-
"
|
| 90 |
-
|
| 91 |
-
|
| 92 |
-
"
|
| 93 |
-
"
|
| 94 |
-
"known_deprioritization": true,
|
| 95 |
-
"ready_for_fft": true,
|
| 96 |
-
"uncontained_hallucination": true
|
| 97 |
},
|
| 98 |
-
"
|
| 99 |
-
|
| 100 |
-
"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 101 |
],
|
| 102 |
-
"
|
| 103 |
-
"
|
| 104 |
-
"report": "/dev/shm/nexa_mat_controller_rollout_reverse_eval.md",
|
| 105 |
-
"structured_output_validity": 1.0,
|
| 106 |
-
"uncontained_hallucination_rate": 0.0
|
| 107 |
}
|
| 108 |
},
|
| 109 |
-
"
|
| 110 |
-
"
|
| 111 |
-
"
|
| 112 |
-
|
| 113 |
-
"preserve physically plausible low-evidence novelty as DFT candidates",
|
| 114 |
-
"deprioritize known duplicates unless conservative mode allows them",
|
| 115 |
-
"route unsupported claims to retrieve-more or human review"
|
| 116 |
-
],
|
| 117 |
-
"reverse": "candidate pool -> encoder/task/evidence scoring -> optional decoder expansion -> controller rank/filter/explain"
|
| 118 |
},
|
| 119 |
-
"
|
| 120 |
-
|
|
|
|
|
|
|
|
|
|
| 121 |
}
|
|
|
|
| 1 |
{
|
| 2 |
+
"name": "Nexa_Mat Gen Stack",
|
| 3 |
+
"model_id": "AethronPhantom/Nexa_Mat2",
|
| 4 |
+
"published_at": "2026-05-20T01:11:29Z",
|
| 5 |
"components": {
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 6 |
"encoder": {
|
| 7 |
+
"component": "nexa_mat_encoder_v1",
|
| 8 |
+
"role": "frozen physics-grounding encoder",
|
| 9 |
+
"repo_id": "AethronPhantom/Nexa_Mat2",
|
| 10 |
+
"path": "encoder/v1/nexa_mat_V1_final.safetensors",
|
| 11 |
+
"artifact_uri": "hf://AethronPhantom/Nexa_Mat2/encoder/v1/nexa_mat_V1_final.safetensors",
|
| 12 |
+
"source_checkpoint_uri": "wasabi:nexa-mat/models/nexa_mat/encoder-pretrain/full_v1/2026-05-06/nexa_mat_encoder_blackwell_full_v1_continue_to_200k_20260506T075034Z/nexa_mat_V1_final.pt",
|
| 13 |
+
"published_at": "2026-05-20T01:11:29Z",
|
| 14 |
+
"format": "safetensors_model_state_only",
|
| 15 |
+
"stats": {
|
| 16 |
+
"bytes": 11264456,
|
| 17 |
+
"sha256": "a39e1db3c86622cc36bc2610a47af0f6336578fc3b644a7068ed62190853e9a0"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 18 |
},
|
| 19 |
+
"architecture": {
|
| 20 |
+
"family": "directional_potential",
|
| 21 |
+
"hidden_dim": 192,
|
| 22 |
+
"egnn_layers": 4,
|
| 23 |
+
"max_neighbors": 8,
|
| 24 |
+
"radial_basis": 64,
|
| 25 |
+
"cutoff_angstrom": 6.0,
|
| 26 |
+
"message_aggregation": "learned",
|
| 27 |
+
"energy_mode": "atomwise_sum",
|
| 28 |
+
"absolute_coords": false,
|
| 29 |
+
"parameters": 2813714
|
| 30 |
},
|
| 31 |
+
"training": {
|
| 32 |
+
"phase": "encoder_full_pretrain_v1",
|
| 33 |
+
"steps": 200000,
|
| 34 |
+
"dataset": "nexa_mat_v1 force-compatible OMat24 surface",
|
| 35 |
+
"science_status": "frozen_for_downstream_generative_experiments"
|
| 36 |
+
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 37 |
},
|
| 38 |
+
"diffusion_decoder": {
|
| 39 |
+
"component": "nexa_mat_diffusion_v1",
|
| 40 |
+
"role": "constrained best-of-N diffusion proposal decoder",
|
| 41 |
+
"repo_id": "AethronPhantom/Nexa_Mat2",
|
| 42 |
+
"path": "decoder/diffusion_v1/final_checkpoint.safetensors",
|
| 43 |
+
"artifact_uri": "hf://AethronPhantom/Nexa_Mat2/decoder/diffusion_v1/final_checkpoint.safetensors",
|
| 44 |
+
"source_checkpoint_uri": "wasabi:nexa-mat/models/nexa_mat/diffusion-generation-v1/prod/nexa_mat_diffusion_prod_fp32_b512_phase_sampler_20260512T162654Z/final_checkpoint.pt",
|
| 45 |
+
"published_at": "2026-05-20T01:11:29Z",
|
| 46 |
+
"format": "safetensors_model_state_only",
|
| 47 |
+
"stats": {
|
| 48 |
+
"bytes": 16263948,
|
| 49 |
+
"sha256": "d55b837f9600e82846e396f1a9384d52e99a17c43ac5a7d53bd14bb24d3e7395"
|
| 50 |
+
},
|
| 51 |
+
"architecture": {
|
| 52 |
+
"training_mode": "template-conditioned diffusion repair",
|
| 53 |
+
"precision": "fp32",
|
| 54 |
+
"frozen_encoder_parameters": 2813714,
|
| 55 |
+
"trainable_diffusion_parameters": 1248145,
|
| 56 |
+
"full_parameters": 4061859,
|
| 57 |
+
"uses_encoder_features": true,
|
| 58 |
+
"branches": [
|
| 59 |
+
"atom_reconstruction",
|
| 60 |
+
"fractional_coordinate_repair",
|
| 61 |
+
"pair_distance_repair",
|
| 62 |
+
"lattice_residual_repair",
|
| 63 |
+
"conservative_update_gates"
|
| 64 |
+
]
|
| 65 |
},
|
| 66 |
+
"training": {
|
| 67 |
+
"phase": "diffusion_generation_v1_prod",
|
| 68 |
+
"steps": 225000,
|
| 69 |
+
"operating_mode": "sampler_aware_best_of_n_with_filtering",
|
| 70 |
+
"science_status": "usable_as_constrained_generator_not_one_shot_oracle"
|
|
|
|
|
|
|
|
|
|
| 71 |
},
|
| 72 |
+
"final_eval": {
|
| 73 |
+
"atom_accuracy": 0.99988,
|
| 74 |
+
"coord_improvement_fraction": 0.70544,
|
| 75 |
+
"pair_distance_improvement_fraction": 0.7122,
|
| 76 |
+
"lattice_improvement_fraction": 0.55273,
|
| 77 |
+
"sampler_valid_geometry_rate": 0.66406,
|
| 78 |
+
"valid_geometry_rate": 0.75
|
| 79 |
+
}
|
| 80 |
+
},
|
| 81 |
+
"multimodal_controller": {
|
| 82 |
+
"component": "qwen3_14b_controller_partial_fft",
|
| 83 |
+
"repo_id": "AethronPhantom/Nexa_Mat2",
|
| 84 |
+
"path": "multimodal/controller/nexa_mat_controller_fft_pilot_20260518T234148Z/final_model_merged/model.safetensors",
|
| 85 |
+
"artifact_uri": "hf://AethronPhantom/Nexa_Mat2/multimodal/controller/nexa_mat_controller_fft_pilot_20260518T234148Z/final_model_merged/model.safetensors",
|
| 86 |
+
"base_model": "Qwen/Qwen3-14B",
|
| 87 |
+
"status": "experimental_controller_partial_fft"
|
| 88 |
+
},
|
| 89 |
+
"cross_attention": {
|
| 90 |
+
"component": "nexa_mat_cross_attention_contract_v1",
|
| 91 |
+
"status": "interface_contract",
|
| 92 |
+
"purpose": "condition diffusion proposals and multimodal controller evidence on shared structure, text, task, and model-state lanes",
|
| 93 |
+
"lanes": [
|
| 94 |
+
{
|
| 95 |
+
"name": "structure_latent",
|
| 96 |
+
"producer": "encoder/v1/nexa_mat_V1_final.safetensors",
|
| 97 |
+
"consumer": "diffusion decoder and controller"
|
| 98 |
+
},
|
| 99 |
+
{
|
| 100 |
+
"name": "diffusion_state",
|
| 101 |
+
"producer": "decoder/diffusion_v1/final_checkpoint.safetensors",
|
| 102 |
+
"consumer": "controller ranking and evidence packet"
|
| 103 |
+
},
|
| 104 |
+
{
|
| 105 |
+
"name": "text_intent",
|
| 106 |
+
"producer": "Qwen controller tokens",
|
| 107 |
+
"consumer": "diffusion conditioning and reverse ranking"
|
| 108 |
+
},
|
| 109 |
+
{
|
| 110 |
+
"name": "evidence_context",
|
| 111 |
+
"producer": "retrieval/controller",
|
| 112 |
+
"consumer": "decision layer"
|
| 113 |
+
},
|
| 114 |
+
{
|
| 115 |
+
"name": "task_heads",
|
| 116 |
+
"producer": "SSB/battery-ion adapters",
|
| 117 |
+
"consumer": "reverse pool scoring and use-case constraints"
|
| 118 |
+
}
|
| 119 |
],
|
| 120 |
+
"forward_flow": "constraints -> controller intent tokens -> diffusion proposals -> encoder plausibility scoring -> controller evidence and ranking",
|
| 121 |
+
"reverse_flow": "candidate pool -> encoder/task/evidence scoring -> optional decoder expansion -> controller rank/filter/explain"
|
|
|
|
|
|
|
|
|
|
| 122 |
}
|
| 123 |
},
|
| 124 |
+
"space": {
|
| 125 |
+
"repo_id": "AethronPhantom/nexamat-crystal-viewer",
|
| 126 |
+
"url": "https://huggingface.co/spaces/AethronPhantom/nexamat-crystal-viewer",
|
| 127 |
+
"runtime": "gradio.Server custom frontend with ZeroGPU model_stack hook"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 128 |
},
|
| 129 |
+
"safety_and_limits": [
|
| 130 |
+
"Generated structures are candidates for triage, not DFT-confirmed stable materials.",
|
| 131 |
+
"Decoder is best used as constrained best-of-N generation with encoder filtering.",
|
| 132 |
+
"Controller is experimental and should ground claims in evidence/context rather than inventing support."
|
| 133 |
+
]
|
| 134 |
}
|