HiMind committed on
Commit
81fa0ce
·
verified ·
1 Parent(s): 34aca5b

Upload 3 files

Browse files
Files changed (3) hide show
  1. ASI.py +303 -0
  2. MMM.py +1077 -0
  3. mmm.pt +3 -0
ASI.py ADDED
@@ -0,0 +1,303 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Speaker_ID.py
2
+ # By Chance Brownfield
3
+ import torch
4
+ import numpy as np
5
+ import librosa
6
+ import asyncio
7
+ import tempfile
8
+ import os
9
+ import time
10
+ import traceback
11
+ from typing import AsyncGenerator, Dict, Any, Optional, Union, Iterable
12
+
13
+ import speech_recognition as sr
14
+ from MMM import MMM
15
+
16
+
17
class Speaker_ID:
    """Speaker identification on top of an MMM model manager.

    Uses a shared "base" model from the manager to embed audio, enrolls
    per-speaker models back into the manager, and identifies speakers by
    scoring an embedding against every enrolled model.
    """

    def __init__(
        self,
        mmm_manager,
        base_model_id: str = "unknown",
        device: Union[str, torch.device, None] = None,
        seq_len: int = 1200,
        sr: int = 1200,
    ):
        """
        Args:
            mmm_manager: manager exposing ``.models`` (id -> torch module),
                ``.fit_and_add`` and ``.score``.
            base_model_id: key of the shared embedding model; doubles as the
                "unknown speaker" label returned by :meth:`identify`.
            device: torch device; auto-selects CUDA when available if None.
            seq_len: fixed sample count each clip is padded/truncated to.
            sr: sample rate passed to librosa when loading audio files.
                NOTE(review): 1200 Hz is unusually low for speech — confirm it
                matches how the base model was trained.

        Raises:
            ValueError: if the manager has no ``.models`` attribute.
            KeyError: if ``base_model_id`` is not in the manager.
        """
        self.mmm = mmm_manager
        self.base_model_id = base_model_id
        self.seq_len = int(seq_len)
        self.sr = int(sr)

        if device is None:
            self.device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
        else:
            self.device = torch.device(device)

        if not hasattr(self.mmm, "models"):
            raise ValueError("Provided mmm_manager does not look like an MMM manager (missing .models).")

        if self.base_model_id not in self.mmm.models:
            available = list(self.mmm.models.keys())
            raise KeyError(f"Base model id '{self.base_model_id}' not found. Available keys: {available}")

        self.base_model = self.mmm.models[self.base_model_id].to(self.device)
        self.base_model.eval()

    def _audio_to_tensor(self, wav_path: str) -> torch.Tensor:
        """Load a WAV file as a normalized, fixed-length (seq_len, 1) tensor.

        Raises:
            RuntimeError: if the file decodes to zero samples.
        """
        y, _ = librosa.load(str(wav_path), sr=self.sr, mono=True)
        y = y.astype(np.float32)
        if y.size == 0:
            raise RuntimeError(f"Empty audio file: {wav_path}")
        # Peak-normalize so amplitude differences between clips do not
        # dominate the embedding.
        maxv = float(np.max(np.abs(y)))
        if maxv > 0:
            y = y / maxv
        # Pad with zeros or truncate to exactly seq_len samples.
        if y.shape[0] < self.seq_len:
            y = np.pad(y, (0, self.seq_len - y.shape[0]))
        else:
            y = y[: self.seq_len]
        return torch.from_numpy(y).unsqueeze(-1)

    def _ensure_tensor(self, features: Union[np.ndarray, torch.Tensor]) -> torch.Tensor:
        """Coerce raw features to a float tensor of shape (T, F).

        1-D input is treated as (T,) and given a trailing feature axis.

        Raises:
            TypeError: for unsupported input types.
            ValueError: for tensors with more than two dimensions.
        """
        if isinstance(features, np.ndarray):
            t = torch.from_numpy(features)
        elif torch.is_tensor(features):
            t = features.clone()
        else:
            raise TypeError("audio_features must be numpy array or torch tensor or audio file path")

        if t.dim() == 1:
            t = t.unsqueeze(-1)
        if t.dim() == 2:
            return t.float()
        raise ValueError(f"Unexpected features tensor shape: {t.shape}")

    def generate_embedding(self, audio_input: Union[str, np.ndarray, torch.Tensor]) -> np.ndarray:
        """Embed audio (a file path or raw features) with the base model.

        The model output is accepted either as a dict (preferring 'mu', then
        'z', then 'reconstruction') or as a bare tensor; in every case the
        result is averaged over the leading (time) dimension.

        Raises:
            KeyError: if the model output contains nothing usable.
        """
        if isinstance(audio_input, str):
            x = self._audio_to_tensor(audio_input)
        else:
            x = self._ensure_tensor(audio_input)
        x = x.to(self.device)
        if x.dim() == 2:
            x = x.unsqueeze(1)  # (T, F) -> (T, 1, F): add a batch axis of 1

        with torch.no_grad():
            out = self.base_model(x)

        if isinstance(out, dict):
            if "mu" in out:
                mu = out["mu"]
                emb_bz = mu.mean(dim=0)
                emb = emb_bz.squeeze(0).cpu().numpy()
                return emb
            if "z" in out:
                z = out["z"].mean(dim=0).squeeze(0).cpu().numpy()
                return z
            if "reconstruction" in out:
                recon = out["reconstruction"].mean(dim=0).squeeze(0).cpu().numpy()
                return recon

        if torch.is_tensor(out):
            arr = out.mean(dim=0).squeeze(0).cpu().numpy()
            return arr

        raise KeyError("Base model forward did not return 'mu', 'z', 'reconstruction' or a tensor to use as embedding.")

    def enroll_speaker(
        self,
        speaker_id: str,
        audio_input: Union[str, np.ndarray, torch.Tensor],
        model_type: str = "mmm",
        n_components: int = 4,
        epochs: int = 50,
        lr: float = 1e-3,
        seq_len_for_mmm: Optional[int] = None,
        **fit_kwargs,
    ) -> str:
        """Embed the audio and fit a per-speaker model into the manager.

        Args:
            speaker_id: manager key the new model is stored under.
            audio_input: path or raw features for the enrollment clip.
            model_type: 'gmm', 'hmm' or 'mmm'.
            n_components: mixture components for the gmm path.
            epochs, lr: optimization settings forwarded to the manager.
            seq_len_for_mmm: sequence length for the hmm/mmm path
                (defaults to self.seq_len).
            **fit_kwargs: extra options forwarded to ``fit_and_add``; may also
                override num_states / n_mix / trans_d_model / trans_nhead /
                trans_layers for the hmm/mmm path.

        Returns:
            The speaker_id the model was stored under.
        """
        model_type = model_type.lower()
        if model_type not in ("gmm", "hmm", "mmm"):
            raise ValueError("model_type must be 'gmm', 'hmm', or 'mmm'")

        emb = self.generate_embedding(audio_input)  # (Z,)
        if model_type == "gmm":
            X = np.asarray(emb, dtype=np.float32)[None, :]  # (1, Z)
            self.mmm.fit_and_add(
                data=X,
                model_type="gmm",
                model_id=speaker_id,
                n_components=n_components,
                lr=lr,
                epochs=epochs,
                **fit_kwargs,
            )
        else:
            T = int(seq_len_for_mmm or self.seq_len)
            z = torch.tensor(emb, dtype=torch.float32, device=self.device)
            seq = z.unsqueeze(0).repeat(T, 1)  # (T, Z): embedding repeated over time
            seq = seq.unsqueeze(1)  # (T, 1, Z)
            # BUGFIX: pop architecture overrides out of fit_kwargs so each is
            # passed exactly once. Previously they were read with
            # fit_kwargs.get(...) AND forwarded again via **fit_kwargs, which
            # raised "got multiple values for keyword argument" whenever the
            # caller supplied any of them.
            num_states = fit_kwargs.pop("num_states", 8)
            n_mix = fit_kwargs.pop("n_mix", 2)
            trans_d_model = fit_kwargs.pop("trans_d_model", 64)
            trans_nhead = fit_kwargs.pop("trans_nhead", 4)
            trans_layers = fit_kwargs.pop("trans_layers", 2)
            self.mmm.fit_and_add(
                data=seq,
                model_type="mmm" if model_type == "mmm" else "hmm",
                model_id=speaker_id,
                input_dim=emb.shape[-1],
                output_dim=emb.shape[-1],
                hidden_dim=emb.shape[-1] * 2,
                z_dim=min(256, emb.shape[-1]),
                rnn_hidden=emb.shape[-1],
                num_states=num_states,
                n_mix=n_mix,
                trans_d_model=trans_d_model,
                trans_nhead=trans_nhead,
                trans_layers=trans_layers,
                lr=lr,
                epochs=epochs,
                **fit_kwargs,
            )

        return speaker_id

    def identify(
        self,
        audio_input: Union[str, np.ndarray, torch.Tensor],
        unknown_label_confidence_margin: float = 0.0,
    ):
        """Score the clip against every model in the manager.

        Returns:
            (best_model_id, best_score, all_scores). Falls back to the base
            ("unknown") label when no model scores at all, or when the best
            score does not beat the unknown score by at least
            ``unknown_label_confidence_margin``.
        """
        emb = self.generate_embedding(audio_input)
        emb_np = np.asarray(emb, dtype=np.float32)
        X_try = emb_np[None, :]

        scores: Dict[str, float] = {}
        for model_id in list(self.mmm.models.keys()):
            try:
                sc = self.mmm.score(model_id, X_try)
                if isinstance(sc, dict):
                    # Some models return per-part scores; average what is numeric.
                    vals = []
                    for v in sc.values():
                        try:
                            vals.append(float(np.asarray(v).mean()))
                        except Exception:
                            pass
                    score_val = float(np.mean(vals)) if vals else float("nan")
                else:
                    try:
                        score_val = float(np.asarray(sc).mean())
                    except Exception:
                        score_val = float(sc)
                scores[model_id] = score_val
            except Exception:
                # Sequence models may reject a single frame; retry with the
                # embedding tiled out to a (T, 1, Z) sequence.
                try:
                    T = self.seq_len
                    seq = np.tile(emb_np[None, :], (T, 1, 1))
                    sc = self.mmm.score(model_id, seq)
                    try:
                        scores[model_id] = float(np.asarray(sc).mean())
                    except Exception:
                        scores[model_id] = float(sc)
                except Exception:
                    continue

        if not scores:
            return self.base_model_id, float("nan"), {}

        best_model, best_score = max(scores.items(), key=lambda kv: kv[1])

        if best_model != self.base_model_id and unknown_label_confidence_margin > 0.0:
            unknown_score = scores.get(self.base_model_id, float("-inf"))
            if best_score <= unknown_score + unknown_label_confidence_margin:
                return self.base_model_id, unknown_score, scores

        return best_model, best_score, scores
208
+
209
+
210
# -------- Automatic Speaker Identification --------

async def ASI(
    phrase_time_limit: Optional[float] = 3.0,
    queue_maxsize: int = 8,
    mmm_pt_path: str = "models/MMM/mmm.pt",
) -> AsyncGenerator[Dict[str, Any], None]:
    """Listen on the default microphone and yield speaker-ID results forever.

    Each yielded dict contains either
    ``speaker`` / ``score`` / ``scores`` / ``path`` / ``timestamp`` on
    success, or ``error`` / ``traceback`` / ``path`` / ``timestamp`` when
    identification fails for a clip.

    Args:
        phrase_time_limit: max seconds per captured phrase (forwarded to
            speech_recognition's background listener).
        queue_maxsize: bound on buffered, not-yet-identified clips; when the
            queue is full, new clips are dropped silently.
        mmm_pt_path: path of the serialized MMM manager to load.

    Raises:
        RuntimeError: when the microphone cannot be opened.

    NOTE(review): the temp WAV named in "path" is removed as soon as the
    consumer resumes this generator — read it before advancing.
    """
    mgr = MMM.load(mmm_pt_path)
    speaker_system = Speaker_ID(mmm_manager=mgr, base_model_id="unknown", seq_len=1200, sr=1200)

    loop = asyncio.get_running_loop()
    audio_q: asyncio.Queue = asyncio.Queue(maxsize=queue_maxsize)

    recognizer = sr.Recognizer()
    try:
        mic = sr.Microphone()
    except Exception as e:
        raise RuntimeError("Could not open microphone. Check drivers / permissions.") from e

    def _bg_callback(recognizer_obj: sr.Recognizer, audio: sr.AudioData) -> None:
        # Runs on the listener's worker thread; hand the raw WAV bytes to the
        # event loop thread-safely. A full queue silently drops the clip.
        try:
            wav_bytes = audio.get_wav_data()
            try:
                loop.call_soon_threadsafe(audio_q.put_nowait, wav_bytes)
            except Exception:
                pass
        except Exception:
            traceback.print_exc()

    def _write_temp_wav(b: bytes) -> str:
        # Persist a clip to a temp file for the identifier; the caller is
        # responsible for deleting the returned path.
        # (Hoisted out of the receive loop — it was being redefined on
        # every iteration.)
        tf = tempfile.NamedTemporaryFile(suffix=".wav", delete=False)
        try:
            tf.write(b)
            tf.flush()
            return tf.name
        finally:
            tf.close()

    stop_listening = recognizer.listen_in_background(mic, _bg_callback, phrase_time_limit=phrase_time_limit)

    try:
        while True:
            try:
                wav_bytes = await audio_q.get()
            except asyncio.CancelledError:
                break

            if wav_bytes is None:
                continue

            tmp_path = await loop.run_in_executor(None, _write_temp_wav, wav_bytes)

            try:
                # identify() is CPU-bound; keep the event loop responsive.
                result = await loop.run_in_executor(None, speaker_system.identify, tmp_path)
                best_speaker, best_score, scores = result
                yield {
                    "speaker": best_speaker,
                    "score": best_score,
                    "scores": scores,
                    "path": tmp_path,
                    "timestamp": time.time(),
                }
            except Exception as e:
                yield {
                    "error": str(e),
                    "traceback": traceback.format_exc(),
                    "path": tmp_path,
                    "timestamp": time.time(),
                }
            finally:
                try:
                    os.remove(tmp_path)
                except Exception:
                    pass

    finally:
        # Best-effort shutdown of the background listener thread.
        try:
            stop_listening(wait_for_stop=False)
        except Exception:
            pass
290
+
291
+
292
async def _main_cli():
    """Minimal CLI driver: print every identification result from ASI()."""
    async for result in ASI(phrase_time_limit=3.0):
        if "error" in result:
            print("ID error:", result["error"])
        else:
            ts = time.ctime(result["timestamp"])
            print(f"[{ts}] Predicted: {result['speaker']} (score={result['score']})")
            print("All scores:", result["scores"])


if __name__ == "__main__":
    asyncio.run(_main_cli())
MMM.py ADDED
@@ -0,0 +1,1077 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #MMM.py (Multi-Mixture Model)
2
+ #By, Chance Brownfield
3
+ import torch
4
+ import torch.nn as nn
5
+ import torch.nn.functional as F
6
+ import random
7
+ import string
8
+ import math
9
+ import numpy as np
10
+
11
+ # --- Building Blocks ---
12
+
13
class Encoder(nn.Module):
    """Feed-forward VAE encoder: x -> (mu, logvar) of a diagonal Gaussian."""

    def __init__(self, input_dim, hidden_dim, z_dim):
        super().__init__()
        # Attribute names are part of the checkpoint format (state_dict keys).
        self.fc1 = nn.Linear(input_dim, hidden_dim)
        self.fc_mu = nn.Linear(hidden_dim, z_dim)
        self.fc_logvar = nn.Linear(hidden_dim, z_dim)

    def forward(self, x):
        """Return (mu, logvar) for the input batch."""
        hidden = F.relu(self.fc1(x))
        mu = self.fc_mu(hidden)
        logvar = self.fc_logvar(hidden)
        return mu, logvar
23
+
24
+
25
class Decoder(nn.Module):
    """Feed-forward VAE decoder: z -> sigmoid-squashed reconstruction in [0, 1]."""

    def __init__(self, z_dim, hidden_dim, output_dim):
        super().__init__()
        # Attribute names are part of the checkpoint format (state_dict keys).
        self.fc1 = nn.Linear(z_dim, hidden_dim)
        self.fc_out = nn.Linear(hidden_dim, output_dim)

    def forward(self, z):
        """Map latent z back to input space."""
        hidden = F.relu(self.fc1(z))
        return torch.sigmoid(self.fc_out(hidden))
34
+
35
+
36
class RecurrentNetwork(nn.Module):
    """LSTM producing per-step state emission log-probs plus a learned,
    input-independent log transition matrix."""

    def __init__(self, input_dim, hidden_dim, num_states):
        super().__init__()
        # Attribute names are part of the checkpoint format (state_dict keys).
        self.rnn = nn.LSTM(input_dim, hidden_dim, batch_first=True)
        self.state_emissions = nn.Linear(hidden_dim, num_states)
        self.transition_matrix = nn.Parameter(torch.randn(num_states, num_states))

    def forward(self, x):
        """Return (emission log-probs per step, row-normalized log transitions)."""
        features, _ = self.rnn(x)
        emissions = F.log_softmax(self.state_emissions(features), dim=-1)
        transitions = F.log_softmax(self.transition_matrix, dim=-1)
        return emissions, transitions
48
+
49
+
50
class GaussianMixture(nn.Module):
    """Diagonal-covariance Gaussian mixture with learnable logits, means and
    log-variances, trainable by gradient descent on the log-likelihood."""

    def __init__(self, n_components, n_features):
        super().__init__()
        self.n_components = n_components
        self.n_features = n_features
        # Parameter names are part of the checkpoint format (state_dict keys).
        self.logits = nn.Parameter(torch.zeros(n_components))
        self.means = nn.Parameter(torch.randn(n_components, n_features))
        self.log_vars = nn.Parameter(torch.zeros(n_components, n_features))

    def _coerce(self, X):
        # Move/cast input to the parameters' device and dtype.
        if isinstance(X, torch.Tensor):
            return X.to(self.means.device).type(self.means.dtype)
        return torch.tensor(X, dtype=self.means.dtype, device=self.means.device)

    def get_weights(self):
        """Mixture weights (softmax over the component logits)."""
        return F.softmax(self.logits, dim=0)

    def get_means(self):
        """Component means, shape (K, D)."""
        return self.means

    def get_variances(self):
        """Component diagonal variances, shape (K, D)."""
        return torch.exp(self.log_vars)

    def log_prob(self, X):
        """Per-sample log-likelihood log p(x) for X of shape (N, D)."""
        X = self._coerce(X)
        _, D = X.shape
        diff = X.unsqueeze(1) - self.means.unsqueeze(0)           # (N, K, D)
        inv_vars = torch.exp(-self.log_vars)
        exp_term = -0.5 * torch.sum(diff * diff * inv_vars.unsqueeze(0), dim=2)
        log_norm = -0.5 * (torch.sum(self.log_vars, dim=1) + D * math.log(2 * math.pi))
        comp_log_prob = exp_term + log_norm.unsqueeze(0)          # (N, K)
        weighted = comp_log_prob + F.log_softmax(self.logits, dim=0).unsqueeze(0)
        return torch.logsumexp(weighted, dim=1)

    def get_log_likelihoods(self, X):
        """log_prob computed without grad, returned as a numpy array."""
        X = self._coerce(X)
        with torch.no_grad():
            return self.log_prob(X).cpu().numpy()

    def score(self, X):
        """Mean log-likelihood across samples, as a float."""
        return float(self.get_log_likelihoods(X).mean())
95
+
96
+
97
class HiddenMarkov(nn.Module):
    """HMM with per-state diagonal Gaussian-mixture emissions, trained by
    gradient descent on the forward-algorithm log-likelihood."""

    def __init__(self, n_states, n_mix, n_features):
        super().__init__()
        self.n_states = n_states
        self.n_mix = n_mix
        self.n_features = n_features
        # Parameter names are part of the checkpoint format (state_dict keys).
        self.pi_logits = nn.Parameter(torch.zeros(n_states))
        self.trans_logits = nn.Parameter(torch.zeros(n_states, n_states))
        self.weight_logits = nn.Parameter(torch.zeros(n_states, n_mix))
        self.means = nn.Parameter(torch.randn(n_states, n_mix, n_features))
        self.log_vars = nn.Parameter(torch.zeros(n_states, n_mix, n_features))

    def get_initial_prob(self):
        """Initial state distribution pi (softmax over pi_logits)."""
        return F.softmax(self.pi_logits, dim=0)

    def get_transition_matrix(self):
        """Row-stochastic transition matrix A[i, j] = P(next=j | cur=i)."""
        return F.softmax(self.trans_logits, dim=1)

    def get_weights(self):
        """Per-state mixture weights, shape (S, M)."""
        return F.softmax(self.weight_logits, dim=1)

    def get_means(self):
        """Emission means, shape (S, M, D)."""
        return self.means

    def get_variances(self):
        """Emission diagonal variances, shape (S, M, D)."""
        return torch.exp(self.log_vars)

    def log_prob(self, X):
        """Forward-algorithm log p(X) for one sequence X of shape (T, D)."""
        if not isinstance(X, torch.Tensor):
            X = torch.tensor(X, dtype=self.means.dtype, device=self.means.device)
        else:
            X = X.to(self.means.device).type(self.means.dtype)
        T, D = X.shape
        # Emission log-probs: logsumexp over mixture components per state.
        diff = X.unsqueeze(1).unsqueeze(2) - self.means.unsqueeze(0)     # (T, S, M, D)
        inv_vars = torch.exp(-self.log_vars)
        exp_term = -0.5 * torch.sum(diff * diff * inv_vars.unsqueeze(0), dim=3)
        log_norm = -0.5 * (torch.sum(self.log_vars, dim=2) + D * math.log(2 * math.pi))
        comp_log_prob = exp_term + log_norm.unsqueeze(0)                 # (T, S, M)
        log_mix_weights = F.log_softmax(self.weight_logits, dim=1)
        weighted = comp_log_prob + log_mix_weights.unsqueeze(0)
        emission_log_prob = torch.logsumexp(weighted, dim=2)             # (T, S)
        # Forward recursion in log space.
        log_pi = F.log_softmax(self.pi_logits, dim=0)
        log_A = F.log_softmax(self.trans_logits, dim=1)
        alpha = log_pi + emission_log_prob[0]
        for t in range(1, T):
            # alpha_t[j] = em_t[j] + logsumexp_i(alpha_{t-1}[i] + log_A[i, j]).
            # BUGFIX: the reduction must be over the previous-state axis
            # (dim=0). The old code reduced over dim=1, and since log_A rows
            # are log-softmax-normalized that collapsed to alpha_{t-1} + em_t,
            # silently ignoring the transition matrix entirely.
            alpha = emission_log_prob[t] + torch.logsumexp(alpha.unsqueeze(1) + log_A, dim=0)
        return torch.logsumexp(alpha, dim=0)

    def get_log_likelihoods(self, X):
        """Log-likelihood per sequence; X is (T, D) or a batch (B, T, D)."""
        if not isinstance(X, torch.Tensor):
            X = torch.tensor(X, dtype=self.means.dtype, device=self.means.device)
        else:
            X = X.to(self.means.device).type(self.means.dtype)
        with torch.no_grad():
            if X.dim() == 3:
                return [self.log_prob(seq).item() for seq in X]
            return [self.log_prob(X).item()]

    def score(self, X):
        """Mean log-likelihood across sequences, as a float."""
        lls = self.get_log_likelihoods(X)
        return float(sum(lls) / len(lls))
161
+
162
+
163
class TimeSeriesTransformer(nn.Module):
    """Thin wrapper around nn.Transformer with linear input/output projections."""

    def __init__(self, input_dim, d_model, nhead, num_layers, output_dim, batch_first=True):
        super().__init__()
        self.input_dim = input_dim
        self.d_model = d_model
        self.nhead = nhead
        self.num_encoder_layers = num_layers
        self.output_dim = output_dim
        self.batch_first = batch_first

        # Attribute names are part of the checkpoint format (state_dict keys).
        self.input_proj = nn.Linear(input_dim, d_model)
        self.transformer = nn.Transformer(
            d_model=d_model,
            nhead=nhead,
            num_encoder_layers=num_layers,
            num_decoder_layers=num_layers,
            batch_first=batch_first,
        )
        self.output_proj = nn.Linear(d_model, output_dim)

    def forward(self, src, tgt):
        """Project src/tgt to d_model, run the transformer, project back.

        Shapes follow ``batch_first``: (B, S, input_dim) when True, otherwise
        (S, B, input_dim). When tgt is None, src doubles as the decoder input.
        """
        src_emb = self.input_proj(src)
        if tgt is None:
            out = self.transformer(src_emb, src_emb)
        else:
            out = self.transformer(src_emb, self.input_proj(tgt))
        return self.output_proj(out)
195
+
196
+
197
+
198
class VariationalRecurrentMarkovGaussianTransformer(nn.Module):
    """
    Variational Encoder + RNN-HMM + Hidden GMM + Transformer hybrid.

    Encodes inputs to a latent sequence z, decodes a reconstruction, runs an
    RNN state-emission model and an HMM likelihood over z, and optionally a
    transformer mapping z toward a target sequence. forward() returns all of
    these in one dict; loss() combines reconstruction, KL and HMM NLL terms.
    """
    def __init__(self,
                 input_dim,
                 hidden_dim,
                 z_dim,
                 rnn_hidden,
                 num_states,
                 n_mix,
                 trans_d_model,
                 trans_nhead,
                 trans_layers,
                 output_dim):
        super().__init__()
        self.output_dim = output_dim
        # Submodule attribute names are part of the checkpoint state_dict keys.
        self.encoder = Encoder(input_dim, hidden_dim, z_dim)
        self.decoder = Decoder(z_dim, hidden_dim, output_dim)
        self.rn = RecurrentNetwork(z_dim, rnn_hidden, num_states)
        self.hm = HiddenMarkov(num_states, n_mix, z_dim)
        self.transformer = TimeSeriesTransformer(
            input_dim=z_dim,
            d_model=trans_d_model,
            nhead=trans_nhead,
            num_layers=trans_layers,
            output_dim=output_dim
        )
        # Learnable per-latent-dim gates (passed through sigmoid) for the
        # predict / recognize / generate heads respectively.
        self.pred_weights = nn.Parameter(torch.ones(z_dim))
        self.recog_weights = nn.Parameter(torch.ones(z_dim))
        self.gen_weights = nn.Parameter(torch.ones(z_dim))

    def reparameterize(self, mu, logvar):
        """Standard VAE reparameterization: z = mu + eps * exp(0.5 * logvar)."""
        std = torch.exp(0.5 * logvar)
        eps = torch.randn_like(std)
        return mu + eps * std

    def forward(self, x, tgt=None):
        """Run the full hybrid pipeline.

        Args:
            x: input of dim 3 (treated as (T, B, input_dim), encoded per
               timestep) or lower-dim input that is lifted to (T, B, Z) below.
            tgt: optional transformer decoder target; when None the
               transformer branch is skipped (transformer_out is None).

        Returns:
            dict with 'reconstruction', 'mu', 'logvar', 'emissions',
            'transitions', 'hgmm_log_likelihood' (shape (B,)),
            'transformer_out'.
        """
        if x.dim() == 3:
            # Encode each timestep separately, then restack to (T, B, Z).
            T, B, _ = x.size()
            zs, mus, logvars = [], [], []
            for t in range(T):
                mu_t, logvar_t = self.encoder(x[t])
                z_t = self.reparameterize(mu_t, logvar_t)
                zs.append(z_t)
                mus.append(mu_t)
                logvars.append(logvar_t)
            zs = torch.stack(zs)        # (T, B, Z)
            mus = torch.stack(mus)      # (T, B, Z)
            logvars = torch.stack(logvars)  # (T, B, Z)
        else:
            # Non-sequence input: encode once and lift to a (T, B, Z) layout.
            mu, logvar = self.encoder(x)
            zs = self.reparameterize(mu, logvar)
            if zs.dim() == 1:
                zs = zs.unsqueeze(0).unsqueeze(1)  # (1, 1, Z)
                mus = mu.unsqueeze(0).unsqueeze(1)
                logvars = logvar.unsqueeze(0).unsqueeze(1)
            elif zs.dim() == 2:
                # (N, Z) -> (N, 1, Z): first axis treated as time.
                zs = zs.unsqueeze(1)
                mus = mu.unsqueeze(1)
                logvars = logvar.unsqueeze(1)
            else:
                # already (T,B,Z)
                mus, logvars = mu, logvar

        T, B, _ = zs.size()
        recon = self.decoder(zs.view(-1, zs.size(-1))).view(T, B, self.output_dim)
        # Best-effort reshape back to the caller's layout; silently kept as
        # (T, B, output_dim) when element counts do not match.
        # NOTE(review): both branches are identical — the x.dim() check here
        # is redundant as written.
        try:
            if x.dim() == 3:
                recon = recon.view_as(x)
            else:
                recon = recon.view_as(x)
        except Exception:
            pass

        emissions, transitions = self.rn(zs.permute(1, 0, 2))  # emissions shape (B, T, num_states)

        # HMM log-likelihood of each batch element's latent trajectory.
        Tz, Bz, Z = zs.shape
        seq_lls = []
        for b in range(Bz):
            ll_b = self.hm.log_prob(zs[:, b, :])  # should be a scalar tensor (dtype/device consistent)
            if not torch.is_tensor(ll_b):
                ll_b = torch.tensor(ll_b, dtype=zs.dtype, device=zs.device)
            seq_lls.append(ll_b)
        hgmm_ll = torch.stack(seq_lls, dim=0)  # (B,)

        trans_out = self.transformer(zs, tgt) if tgt is not None else None

        return {
            'reconstruction': recon,
            'mu': mus,
            'logvar': logvars,
            'emissions': emissions,
            'transitions': transitions,
            'hgmm_log_likelihood': hgmm_ll,  # shape (B,)
            'transformer_out': trans_out
        }

    def loss(self, x, outputs):
        """ELBO-style training loss: reconstruction MSE + KL + HMM NLL."""
        recon, mu, logvar = outputs['reconstruction'], outputs['mu'], outputs['logvar']
        recon_loss = F.mse_loss(recon, x, reduction='sum')
        # KL divergence of N(mu, exp(logvar)) from the standard normal prior.
        kld = -0.5 * torch.sum(1 + logvar - mu.pow(2) - logvar.exp())
        hgmm_nll = -torch.sum(outputs['hgmm_log_likelihood'])
        return recon_loss + kld + hgmm_nll

    def predict(self, x):
        """
        Given x, predict next‐step (or next‐sequence) by:
          1) encoding to z,
          2) reweighting latent dims by pred_weights,
          3) decoding back to input space.
        """
        mu, logvar = self.encoder(x)
        z = self.reparameterize(mu, logvar)
        z_pred = z * torch.sigmoid(self.pred_weights)
        return self.decoder(z_pred)

    def predict_loss(self, x, target, reward):
        """
        MSE between predict(x) and target,
        weighted by a scalar reward (+/-).
        """
        pred = self.predict(x)
        loss = F.mse_loss(pred, target, reduction='mean')
        return reward * loss

    def recognize(self, x, tgt_z=None):
        """
        Recognize: map x→z, then transform to tgt_z space via transformer,
        then decode to reconstruct in original space.
        """
        mu, logvar = self.encoder(x)
        z = self.reparameterize(mu, logvar)
        if tgt_z is not None:
            z_in = z.unsqueeze(0)
            tgt = tgt_z.unsqueeze(0)
            z_out = self.transformer(z_in, tgt).squeeze(0)
        else:
            z_out = z
        z_rec = z_out * torch.sigmoid(self.recog_weights)
        return self.decoder(z_rec)

    def recognition_loss(self, x, target, reward):
        """
        Recon loss between recognize(x) and target,
        weighted by reward.
        """
        rec = self.recognize(x)
        loss = F.mse_loss(rec, target, reduction='mean')
        return reward * loss


    def generate(self, num_steps, batch_size=1, z0=None):
        """
        Generate a sequence of length num_steps by:
          1) sampling initial z from prior (HMM's mixture),
          2) rolling it through the RNN-HMM to get a latent trajectory,
          3) reweight by gen_weights and decode each step.

        NOTE(review): the z0 parameter is accepted but never used.
        """
        pi = self.hm.get_initial_prob().detach()
        state = torch.multinomial(pi, num_samples=batch_size, replacement=True)
        z = []
        for t in range(num_steps):
            # Sample a mixture component per batch element, take its mean.
            w = self.hm.get_weights()[state]  # (B, n_mix)
            mix_idx = torch.multinomial(w, 1).squeeze(-1)
            mu_t = self.hm.get_means()[state, mix_idx]
            z_t = mu_t * torch.sigmoid(self.gen_weights)
            z.append(z_t)
            # Sample the next hidden state from the transition row.
            A = self.hm.get_transition_matrix()[state]
            state = torch.multinomial(A, 1).squeeze(-1)
        Z = torch.stack(z, dim=0)  # (T, B, Z)
        recon = self.decoder(Z.view(-1, Z.size(-1))).view(num_steps, batch_size, -1)
        return recon

    def generation_loss(self, generated, target_seq, reward):
        """
        Sequence‐level loss between generated and target,
        weighted by reward (+/-).
        """
        loss = F.mse_loss(generated, target_seq, reduction='mean')
        return reward * loss
379
+
380
+
381
class MMTransformer(nn.Module):
    """Multi-Mixture Transformer.

    Wraps a single GaussianMixture ('gmm') or HiddenMarkov ('hgmm'/'hmm')
    and trains it by gradient descent; fitted models are retained in
    ``self.gmms`` / ``self.hgmm_models`` keyed by data_id.
    """

    def __init__(self, n_components, n_features, model_type='gmm', n_mix=1):
        """
        Args:
            n_components: GMM components, or HMM states.
            n_features: feature dimensionality.
            model_type: 'gmm', or 'hgmm'/'hmm' for the hidden-Markov variant.
            n_mix: mixture components per HMM state.
        """
        super().__init__()
        self.model_type = model_type.lower()
        self.n_features = n_features
        self.gmms = []
        self.hgmm_models = {}
        self.active_hmm = None
        if self.model_type == 'gmm':
            self.gmm = GaussianMixture(n_components, n_features)
        elif self.model_type in ('hgmm', 'hmm'):
            # BUGFIX: accept 'hmm' as an alias — MMModel.fit constructs this
            # class with model_type='hmm', which previously raised ValueError.
            self.hm = HiddenMarkov(n_components, n_mix, n_features)
        else:
            raise ValueError("model_type must be 'gmm', 'hgmm' or 'hmm'")

    def _prepare_tensor(self, X):
        """Coerce input to a float32 tensor."""
        return torch.tensor(X, dtype=torch.float32) if not isinstance(X, torch.Tensor) else X.float()

    def fit(self, X, init_params=None, lr=1e-2, epochs=100, verbose=False, data_id=None):
        """Fit the wrapped model on X by maximizing log-likelihood with Adam.

        Args:
            X: (N, D) samples for a GMM; (T, D) or (B, T, D) for an HMM.
            init_params: optional state_dict (or path) to warm-start from.
            lr, epochs: Adam settings.
            verbose: print the loss every 10 epochs.
            data_id: storage id; int for GMMs (auto-assigned when None),
                str for HMMs (random 6-letter id when None).

        Returns:
            The data_id the fitted model was stored under.
        """
        if init_params is not None:
            self.import_model(init_params)

        X_tensor = self._prepare_tensor(X).to(next(self.parameters()).device)
        optimizer = torch.optim.Adam(self.parameters(), lr=lr)

        for epoch in range(epochs):
            optimizer.zero_grad()
            if self.model_type == 'gmm':
                loss = -torch.mean(self.gmm.log_prob(X_tensor))
            else:
                # Average the per-sequence NLL over a batch of sequences.
                if X_tensor.dim() == 3:
                    loss = -sum(self.hm.log_prob(seq) for seq in X_tensor) / X_tensor.size(0)
                else:
                    loss = -self.hm.log_prob(X_tensor)
            loss.backward()
            optimizer.step()
            if verbose and epoch % 10 == 0:
                print(f"Epoch {epoch}, Loss: {loss.item():.4f}")

        if self.model_type == 'gmm':
            if data_id is None:
                data_id = len(self.gmms)
            # Skip forward past occupied slots.
            while isinstance(data_id, int) and data_id < len(self.gmms) and self.gmms[data_id] is not None:
                data_id += 1
            if isinstance(data_id, int) and data_id >= len(self.gmms):
                # Pad with None so an explicit out-of-range id cannot IndexError.
                while len(self.gmms) < data_id:
                    self.gmms.append(None)
                self.gmms.append(self.gmm)
            else:
                self.gmms[data_id] = self.gmm
        else:
            if data_id is None:
                # Random 6-letter id, retried until unused.
                while True:
                    data_id = ''.join(random.choices(string.ascii_lowercase, k=6))
                    if data_id not in self.hgmm_models:
                        break
            self.hgmm_models[data_id] = self.hm
            self.active_hmm = data_id

        return data_id

    def unfit(self, data_id):
        """Delete a stored model: int ids index GMMs, str ids name HMMs."""
        if isinstance(data_id, int):
            if 0 <= data_id < len(self.gmms):
                del self.gmms[data_id]
            else:
                raise ValueError(f"GMM with id {data_id} does not exist.")
        elif isinstance(data_id, str):
            if data_id in self.hgmm_models:
                del self.hgmm_models[data_id]
                if self.active_hmm == data_id:
                    self.active_hmm = None
            else:
                raise ValueError(f"HMM model with name '{data_id}' does not exist.")
        else:
            raise TypeError("data_id must be an int (GMM) or str (HMM)")

    def check_data(self):
        """Map each stored id to its kind ('gmm' / 'hmm'); None slots skipped."""
        data = {i: 'gmm' for i in range(len(self.gmms)) if self.gmms[i] is not None}
        data.update({name: 'hmm' for name in self.hgmm_models.keys()})
        return data

    def score(self, X):
        """Mean log-likelihood of X under the wrapped model (no grad)."""
        with torch.no_grad():
            X_tensor = self._prepare_tensor(X).to(next(self.parameters()).device)
            if self.model_type == 'gmm':
                return float(self.gmm.log_prob(X_tensor).mean().cpu().item())
            else:
                if X_tensor.dim() == 3:
                    return float(sum(self.hm.log_prob(seq).item() for seq in X_tensor) / X_tensor.size(0))
                else:
                    return float(self.hm.log_prob(X_tensor).cpu().item())

    def get_log_likelihoods(self, X):
        """Per-sample (GMM) or per-sequence (HMM) log-likelihoods (no grad)."""
        with torch.no_grad():
            X_tensor = self._prepare_tensor(X).to(next(self.parameters()).device)
            if self.model_type == 'gmm':
                return self.gmm.log_prob(X_tensor).cpu().numpy()
            else:
                if X_tensor.dim() == 3:
                    return [self.hm.log_prob(seq).item() for seq in X_tensor]
                else:
                    return [self.hm.log_prob(X_tensor).item()]

    def get_means(self):
        """Means of the wrapped model as numpy."""
        # BUGFIX: the HMM attribute is self.hm — self.hgmm never existed, so
        # these accessors raised AttributeError for hgmm/hmm instances.
        return (self.gmm if self.model_type == 'gmm' else self.hm).get_means().cpu().detach().numpy()

    def get_variances(self):
        """Variances of the wrapped model as numpy."""
        return (self.gmm if self.model_type == 'gmm' else self.hm).get_variances().cpu().detach().numpy()

    def get_weights(self):
        """Mixture weights of the wrapped model as numpy."""
        return (self.gmm if self.model_type == 'gmm' else self.hm).get_weights().cpu().detach().numpy()

    def export_model(self, filepath=None):
        """Return the state_dict, optionally also saving it to filepath."""
        state = self.state_dict()
        if filepath:
            torch.save(state, filepath)
        return state

    def import_model(self, source):
        """Load parameters from a state_dict or a saved file path."""
        if isinstance(source, str):
            state = torch.load(source)
        elif isinstance(source, dict):
            state = source
        else:
            raise ValueError("Unsupported source for import_model")
        self.load_state_dict(state)
507
+
508
+
509
class MMModel(nn.Module):
    """Multi-Mixture Model: a container for independently fitted mixture components.

    GMM components are stored positionally in ``self.gmms`` (integer ids, with
    ``None`` marking empty/vacated slots so that ids stay stable over time),
    while HMM components live in ``self.hgmm_models`` keyed by random 6-letter
    string ids.

    NOTE(review): ``self.gmms`` is a plain list and ``self.hgmm_models`` a plain
    dict, so the stored sub-models are NOT registered as nn.Module submodules;
    their parameters will not appear in ``state_dict()``/``parameters()``.
    Confirm whether that is intended.
    """

    def __init__(self):
        super().__init__()
        self.gmms = []          # List of GaussianMixture models; None marks a vacated slot
        self.hgmm_models = {}   # Dict of HMM models keyed by string IDs
        self.active_hmm = None  # Optional: id of the active HMM for scoring/fitting

    def _generate_unique_id(self):
        """Return a random 6-letter lowercase id not already used by an HMM entry."""
        while True:
            candidate = ''.join(random.choices(string.ascii_lowercase, k=6))
            if candidate not in self.hgmm_models:
                return candidate

    def fit(self, data=None, model_type='gmm', n_components=1, n_features=1, n_mix=1,
            data_id=None, init_params=None, lr=1e-2, epochs=100):
        """Fit or absorb a model and return its storage id.

        - If ``data`` is a pre-trained ``GaussianMixture``/``HiddenMarkov``, it is
          absorbed (stored) directly.
        - Otherwise ``data`` is treated as training input and a new model is
          trained via ``MMTransformer``.
        - ``data_id`` selects the storage slot; if None, a fresh id is assigned
          (next list index for GMMs, random string for HMMs).

        Raises:
            ValueError: if ``model_type`` is not ``'gmm'`` or ``'hmm'``.
        """
        if model_type == 'gmm':
            if data_id is None:
                # Auto-assign the next positional id (appending at the end keeps
                # previously returned ids valid).
                data_id = len(self.gmms)
            if isinstance(data, GaussianMixture):
                # Absorb a pre-trained GMM directly into the requested slot,
                # padding with None placeholders if the slot is beyond the end.
                if data_id < len(self.gmms):
                    self.gmms[data_id] = data
                else:
                    while len(self.gmms) < data_id:
                        self.gmms.append(None)
                    self.gmms.append(data)
            else:
                # Train a fresh GMM on the raw data, then store it.
                model = MMTransformer(n_components, n_features, model_type='gmm')
                model.fit(data, init_params=init_params, lr=lr, epochs=epochs)
                if data_id < len(self.gmms):
                    self.gmms[data_id] = model.gmm
                else:
                    while len(self.gmms) < data_id:
                        self.gmms.append(None)
                    self.gmms.append(model.gmm)
        elif model_type == 'hmm':
            if data_id is None:
                data_id = self._generate_unique_id()
            if isinstance(data, HiddenMarkov):
                # Absorb a pre-trained HMM directly.
                self.hgmm_models[data_id] = data
            else:
                model = MMTransformer(n_components, n_features, model_type='hmm', n_mix=n_mix)
                model.fit(data, init_params=init_params, lr=lr, epochs=epochs)
                self.hgmm_models[data_id] = model.hm
        else:
            raise ValueError("model_type must be 'gmm' or 'hmm'")
        return data_id

    def export_model(self, data_id):
        """Return the stored model for ``data_id``.

        Integer ids address GMMs, string ids address HMMs. A vacated (``None``)
        GMM slot is treated as nonexistent, consistent with ``check_data``.

        Raises:
            ValueError: if no model is stored under ``data_id``.
            TypeError: if ``data_id`` is neither int nor str.
        """
        if isinstance(data_id, int):
            # Reject vacated slots: returning None here would silently propagate.
            if 0 <= data_id < len(self.gmms) and self.gmms[data_id] is not None:
                return self.gmms[data_id]
            raise ValueError(f"GMM with id {data_id} does not exist.")
        elif isinstance(data_id, str):
            if data_id in self.hgmm_models:
                return self.hgmm_models[data_id]
            else:
                raise ValueError(f"HMM model with name '{data_id}' does not exist.")
        else:
            raise TypeError("data_id must be an int (GMM) or str (HMM)")

    def unfit(self, data_id):
        """Remove a stored model (GMM or HMM) without disturbing other ids.

        For GMMs the slot is cleared to ``None`` instead of being deleted:
        ``list.__delitem__`` would shift every later GMM down by one index and
        silently re-map their ids, while ``fit``/``check_data`` already treat
        ``None`` as an empty slot.

        Raises:
            ValueError: if no model is stored under ``data_id``.
            TypeError: if ``data_id`` is neither int nor str.
        """
        if isinstance(data_id, int):
            if 0 <= data_id < len(self.gmms) and self.gmms[data_id] is not None:
                self.gmms[data_id] = None
            else:
                raise ValueError(f"GMM with id {data_id} does not exist.")
        elif isinstance(data_id, str):
            if data_id in self.hgmm_models:
                del self.hgmm_models[data_id]
                # Drop the active-HMM pointer if it referenced the removed model.
                if self.active_hmm == data_id:
                    self.active_hmm = None
            else:
                raise ValueError(f"HMM model with name '{data_id}' does not exist.")
        else:
            raise TypeError("data_id must be an int (GMM) or str (HMM)")

    def check_data(self):
        """Return a dict mapping each stored model's id to its type.

        - Integer keys -> 'gmm' (``None`` placeholder slots are excluded)
        - String keys  -> 'hmm'
        """
        data = {i: 'gmm' for i in range(len(self.gmms)) if self.gmms[i] is not None}
        data.update({name: 'hmm' for name in self.hgmm_models.keys()})
        return data

    def _all_ids(self):
        """All currently occupied ids (ints for GMMs, strs for HMMs)."""
        return list(self.check_data().keys())

    def _normalize_ids(self, data_ids):
        """Normalize ``data_ids`` (None / scalar / iterable) to a list of ids."""
        if data_ids is None:
            return self._all_ids()
        if isinstance(data_ids, (int, str)):
            return [data_ids]
        return list(data_ids)

    def _get_submodel(self, data_id):
        """Raw slot lookup by id; no existence checking (internal use)."""
        if isinstance(data_id, int):
            return self.gmms[data_id]
        return self.hgmm_models[data_id]

    def get_means(self, data_ids=None):
        """Component means.

        If ``data_ids`` is None, returns ``{id: means}`` for all components;
        if a single id, returns just that component's means;
        if a list/tuple, returns a dict keyed by id.
        """
        ids = self._normalize_ids(data_ids)
        out = {d: self._get_submodel(d).get_means() for d in ids}
        if isinstance(data_ids, (int, str)):
            return out[ids[0]]
        return out

    def get_variances(self, data_ids=None):
        """Component variances; same id-selection semantics as ``get_means``."""
        ids = self._normalize_ids(data_ids)
        out = {d: self._get_submodel(d).get_variances() for d in ids}
        if isinstance(data_ids, (int, str)):
            return out[ids[0]]
        return out

    def get_weights(self, data_ids=None):
        """Component mixture weights; same id-selection semantics as ``get_means``."""
        ids = self._normalize_ids(data_ids)
        out = {d: self._get_submodel(d).get_weights() for d in ids}
        if isinstance(data_ids, (int, str)):
            return out[ids[0]]
        return out

    def score(self, X, data_ids=None):
        """Average log-likelihood(s) of X under each specified component."""
        ids = self._normalize_ids(data_ids)
        out = {d: self._get_submodel(d).score(X) for d in ids}
        if isinstance(data_ids, (int, str)):
            return out[ids[0]]
        return out

    def get_log_likelihoods(self, X, data_ids=None):
        """Per-sample log-likelihood(s) of X under each specified component."""
        ids = self._normalize_ids(data_ids)
        out = {d: self._get_submodel(d).get_log_likelihoods(X) for d in ids}
        if isinstance(data_ids, (int, str)):
            return out[ids[0]]
        return out
class MMM(nn.Module):
    """
    Manager for multiple models: GMM, HMM, and VariationalRecurrentMarkovGaussianTransformer.

    Models are held in an ``nn.ModuleDict`` keyed by string ids. ``fit_and_add``
    trains (or wraps) a model and registers it; the accessor methods delegate to
    the stored ``MMModel`` wrappers. The 'mmm' training path uses MSE for
    reconstruction, gradient clipping, variance clamping, numerical safeguards,
    and optional KL annealing.
    """
    def __init__(self):
        super().__init__()
        # ModuleDict registers stored models as submodules (state_dict, .to(), etc.).
        self.models = nn.ModuleDict()

    def _generate_unique_id(self, prefix='model'):
        """Return '<prefix>_<6 random lowercase letters>' not already in self.models."""
        while True:
            candidate = f"{prefix}_{''.join(random.choices(string.ascii_lowercase, k=6))}"
            if candidate not in self.models:
                return candidate

    def add_model(self, model: nn.Module, model_id: str = None):
        """Register ``model`` under ``model_id`` (auto-generated from the class
        name when None) and return the assigned id.

        Raises:
            KeyError: if ``model_id`` is already in use.
        """
        if model_id is None:
            model_id = self._generate_unique_id(model.__class__.__name__)
        if model_id in self.models:
            raise KeyError(f"Model with id '{model_id}' already exists.")
        self.models[model_id] = model
        return model_id

    def fit_and_add(self,
                    data,
                    model_type: str = 'gmm',
                    model_id: str = None,
                    kl_anneal_epochs: int = 0,
                    clip_norm: float = 5.0,
                    weight_decay: float = 1e-5,
                    **kwargs):
        """Train a model of ``model_type`` on ``data``, register it, and return its id.

        - 'gmm'/'hmm': wraps the fit in a fresh ``MMModel`` (kwargs forwarded to
          ``MMModel.fit``).
        - 'mmm': builds a VariationalRecurrentMarkovGaussianTransformer from
          required kwargs (input_dim, hidden_dim, z_dim, rnn_hidden, num_states,
          n_mix, trans_d_model, trans_nhead, trans_layers, output_dim -- all
          popped, so missing ones raise KeyError) and trains it with
          recon(MSE) + annealed (KLD + HMM negative log-likelihood).

        Args:
            kl_anneal_epochs: epochs over which the KL/HMM weight ramps 0->1
                (0 disables annealing, i.e. full weight from epoch 0).
            clip_norm: max gradient norm for the 'mmm' training loop.
            weight_decay: Adam weight decay for the 'mmm' training loop.

        Raises:
            ValueError: for an unknown ``model_type``.
        """
        model_type = model_type.lower()
        if model_type in ('gmm','hmm'):
            mm = MMModel()
            mm.fit(data, model_type=model_type, **kwargs)
            model = mm

        elif model_type == 'mmm':
            # build hybrid model
            model = VariationalRecurrentMarkovGaussianTransformer(
                kwargs.pop('input_dim'),
                kwargs.pop('hidden_dim'),
                kwargs.pop('z_dim'),
                kwargs.pop('rnn_hidden'),
                kwargs.pop('num_states'),
                kwargs.pop('n_mix'),
                kwargs.pop('trans_d_model'),
                kwargs.pop('trans_nhead'),
                kwargs.pop('trans_layers'),
                kwargs.pop('output_dim')
            )
            optim = torch.optim.Adam(model.parameters(), lr=kwargs.get('lr',1e-4), weight_decay=weight_decay)
            epochs = kwargs.get('epochs',100)
            # NOTE(review): assumes `data` is already a tensor (has .float()) --
            # confirm callers never pass raw lists/arrays on this path.
            x = data.float().to(next(model.parameters()).device)

            for epoch in range(epochs):
                model.train()
                optim.zero_grad()
                out = model(x, kwargs.get('tgt', None))

                # Reconstruction term: summed (not averaged) MSE, so its scale
                # grows with batch/sequence size.
                recon = out['reconstruction']
                recon_loss = F.mse_loss(recon, x, reduction='sum')

                # KL divergence of the variational posterior vs. standard normal;
                # logvar is clamped to avoid exp() overflow/underflow.
                mu, logvar = out['mu'], out['logvar']
                logvar_clamped = torch.clamp(logvar, min=-10.0, max=10.0)
                kld = -0.5 * torch.sum(1 + logvar_clamped - mu.pow(2) - logvar_clamped.exp())

                # HMM term: clamp the per-sample log-likelihoods before negating/summing.
                hgmm_ll = out['hgmm_log_likelihood']
                hgmm_ll = torch.clamp(hgmm_ll, min=-1e6, max=1e6)
                hgmm_nll = -torch.sum(hgmm_ll)

                # Replace NaN/inf so a single bad batch cannot poison the optimizer state.
                kld = torch.nan_to_num(kld, nan=0.0, posinf=1e8, neginf=-1e8)
                hgmm_nll = torch.nan_to_num(hgmm_nll, nan=0.0, posinf=1e8, neginf=-1e8)

                # Linear KL annealing: ramps the regularization weight over
                # kl_anneal_epochs epochs (1.0 when annealing is disabled).
                anneal_w = min(1.0, epoch / kl_anneal_epochs) if kl_anneal_epochs > 0 else 1.0
                loss = recon_loss + anneal_w * (kld + hgmm_nll)

                loss.backward()
                torch.nn.utils.clip_grad_norm_(model.parameters(), clip_norm)
                optim.step()

                # Progress log ~5 times over the run.
                if epoch % max(1, epochs // 5) == 0:
                    print(f"Epoch {epoch}: recon={recon_loss.item():.1f}, kld={kld.item():.1f}, "
                          f"hmll={hgmm_nll.item():.1f}, anneal_w={anneal_w:.2f}")
        else:
            raise ValueError("model_type must be 'gmm','hmm', or 'mmm'")

        assigned_id = self.add_model(model, model_id)
        return assigned_id

    def export_model(self, model_id: str, filepath: str = None):
        """Return the model's state_dict; optionally also torch.save it to ``filepath``.

        Raises:
            KeyError: if ``model_id`` is unknown.
        """
        if model_id not in self.models:
            raise KeyError(f"Model '{model_id}' not found.")
        model = self.models[model_id]
        state = model.state_dict()
        if filepath:
            torch.save(state, filepath)
        return state

    def import_model(self, model_id: str, source):
        """Load parameters into an existing model from a filepath or a state dict.

        Raises:
            KeyError: if ``model_id`` is unknown.
            ValueError: if ``source`` is neither a str path nor a dict.
        """
        if model_id not in self.models:
            raise KeyError(f"Model '{model_id}' not found.")
        model = self.models[model_id]
        if isinstance(source, str):
            # SECURITY NOTE: torch.load unpickles; only load files from trusted sources.
            state = torch.load(source)
        elif isinstance(source, dict):
            state = source
        else:
            raise ValueError("source must be filepath or state dict")
        model.load_state_dict(state)

    def _select_data(self, mm, fn, data_ids=None, *args, **kwargs):
        """Apply ``fn(mm, id, ...)`` over selected sub-model ids of an MMModel.

        None -> all ids (returns dict); scalar id -> bare value; list/tuple -> dict.
        """
        all_keys = list(mm.check_data().keys())
        if data_ids is None:
            ids = all_keys
        elif isinstance(data_ids, (list, tuple)):
            ids = data_ids
        else:
            ids = [data_ids]
        out = {d: fn(mm, d, *args, **kwargs) for d in ids}
        # Scalar request: unwrap the single result for caller convenience.
        if not isinstance(data_ids, (list, tuple)) and data_ids is not None:
            return out[data_ids]
        return out

    def get_means(self, model_id: str, data_ids=None):
        """Means of the selected sub-models of the MMModel stored under ``model_id``."""
        mm = self.get_mmm(model_id)
        return self._select_data(
            mm,
            lambda m, d: m._get_submodel(d).get_means(),
            data_ids
        )

    def get_variances(self, model_id: str, data_ids=None):
        """Variances of the selected sub-models of the MMModel stored under ``model_id``."""
        mm = self.get_mmm(model_id)
        return self._select_data(
            mm,
            lambda m, d: m._get_submodel(d).get_variances(),
            data_ids
        )

    def get_weights(self, model_id: str, data_ids=None):
        """Mixture weights of the selected sub-models of the MMModel under ``model_id``."""
        mm = self.get_mmm(model_id)
        return self._select_data(
            mm,
            lambda m, d: m._get_submodel(d).get_weights(),
            data_ids
        )

    def get_log_likelihoods(self, model_id: str, X, data_ids=None):
        """Per-sample log-likelihoods of X under the selected sub-models."""
        mm = self.get_mmm(model_id)

        def fn(m, d):
            sub = m._get_submodel(d)
            return sub.get_log_likelihoods(X)

        return self._select_data(mm, fn, data_ids)

    def score(self, model_id: str, X, data_ids=None):
        """Average log-likelihood of X under the selected sub-models."""
        mm = self.get_mmm(model_id)

        def fn(m, d):
            sub = m._get_submodel(d)
            return sub.score(X)

        return self._select_data(mm, fn, data_ids)

    def get_mmm(self, model_id: str):
        """Return the stored model for ``model_id``.

        Raises:
            KeyError: if ``model_id`` is unknown.
        """
        if model_id not in self.models:
            raise KeyError(f"Model '{model_id}' not found.")
        return self.models[model_id]

    def save(self, path: str):
        """Pickle the entire manager (all models included) to ``path``."""
        torch.save(self, path)

    @classmethod
    def load(cls, path: str):
        """Load a manager saved by ``save``.

        SECURITY NOTE: ``weights_only=False`` unpickles arbitrary objects and can
        execute code during load -- only load files from trusted sources.
        """
        return torch.load(path, weights_only=False)
class WeightedMMM(MMM):
    """
    Enhanced Multi-Mixture Model with weighted predictions and GPU acceleration support.
    Supports training with reward/punishment signals: a baseline model is fitted
    normally, then a parallel "weighted" copy is trained so that samples carrying
    reward signals get higher likelihood and punished samples get lower likelihood.
    """
    def __init__(self, device=None):
        super().__init__()
        # Default to CUDA when available; callers may pass an explicit device.
        self.device = device if device is not None else torch.device('cuda' if torch.cuda.is_available() else 'cpu')
        self.weighted_models = {}     # model_id -> {'model', 'reward_weight', 'punishment_weight'}
        self.reward_signals = {}      # model_id -> reward signal tensor used at fit time
        self.punishment_signals = {}  # model_id -> punishment signal tensor used at fit time

    def to_device(self, model):
        """Move model to specified device (CPU/GPU)"""
        return model.to(self.device)

    def fit_with_weights(self,
                         data,
                         reward_signals,
                         punishment_signals,
                         model_type='gmm',
                         model_id=None,
                         reward_weight=1.0,
                         punishment_weight=1.0,
                         **kwargs):
        """
        Fit model with weighted predictions using reward and punishment signals.

        Fits a baseline model via ``fit_and_add``, builds an untrained weighted
        twin of the same architecture, records the signals, and trains the twin
        with the reward/punishment objective. Returns the baseline model id
        (also the key for the weighted twin in ``self.weighted_models``).

        Args:
            data: Input sensor data
            reward_signals: Positive reinforcement signals
            punishment_signals: Negative reinforcement signals
            model_type: Type of model ('gmm', 'hmm', or 'mmm')
            model_id: Optional model identifier
            reward_weight: Weight for reward signals
            punishment_weight: Weight for punishment signals
            **kwargs: Additional training parameters

        NOTE(review): ``torch.tensor(data, ...)`` will copy (and warn on) inputs
        that are already tensors -- confirm expected input types of callers.
        """
        data = torch.tensor(data, dtype=torch.float32).to(self.device)
        reward_signals = torch.tensor(reward_signals, dtype=torch.float32).to(self.device)
        punishment_signals = torch.tensor(punishment_signals, dtype=torch.float32).to(self.device)

        # Baseline: ordinary (unweighted) fit, registered under baseline_id.
        baseline_id = self.fit_and_add(data, model_type=model_type, model_id=model_id, **kwargs)
        baseline_model = self.models[baseline_id]

        # Fresh, untrained twin with matching architecture, moved to self.device.
        weighted_model = self._create_weighted_model(baseline_model, model_type)
        weighted_model = self.to_device(weighted_model)

        self.reward_signals[baseline_id] = reward_signals
        self.punishment_signals[baseline_id] = punishment_signals
        self.weighted_models[baseline_id] = {
            'model': weighted_model,
            'reward_weight': reward_weight,
            'punishment_weight': punishment_weight
        }

        self._train_weighted_model(baseline_id, data, reward_signals, punishment_signals, **kwargs)

        return baseline_id

    def _create_weighted_model(self, baseline_model, model_type):
        """Create a weighted version of the baseline model.

        Returns a NEW, untrained model mirroring the baseline's hyperparameters.

        NOTE(review): for 'gmm'/'hmm', ``fit_and_add`` stores an ``MMModel``
        wrapper as the baseline, which does not expose ``n_components`` /
        ``n_states`` etc. directly -- verify these attribute reads against the
        actual stored object.
        """
        if model_type == 'gmm':
            return GaussianMixture(
                n_components=baseline_model.n_components,
                n_features=baseline_model.n_features
            )
        elif model_type == 'hmm':
            return HiddenMarkov(
                n_states=baseline_model.n_states,
                n_mix=baseline_model.n_mix,
                n_features=baseline_model.n_features
            )
        elif model_type == 'mmm':
            # Recover the constructor hyperparameters from the baseline's layers.
            return VariationalRecurrentMarkovGaussianTransformer(
                input_dim=baseline_model.encoder.fc1.in_features,
                hidden_dim=baseline_model.encoder.fc1.out_features,
                z_dim=baseline_model.encoder.fc_mu.out_features,
                rnn_hidden=baseline_model.rn.rnn.hidden_size,
                num_states=baseline_model.rn.state_emissions.out_features,
                n_mix=baseline_model.hm.n_mix,
                trans_d_model=baseline_model.transformer.d_model,
                trans_nhead=baseline_model.transformer.nhead,
                trans_layers=baseline_model.transformer.num_encoder_layers,
                output_dim=baseline_model.transformer.output_proj.out_features
            )
        else:
            raise ValueError(f"Unsupported model type: {model_type}")

    def _train_weighted_model(self, model_id, data, reward_signals, punishment_signals, **kwargs):
        """Train the weighted model using reward and punishment signals.

        Loss per epoch: ``-mean(log_probs * reward) * reward_weight
        + mean(log_probs * punishment) * punishment_weight`` -- i.e. push
        likelihood up on rewarded samples and down on punished ones.

        NOTE(review): for GaussianMixture/HiddenMarkov, if ``log_prob`` returns
        a non-tensor it is re-wrapped via ``torch.as_tensor``, which detaches it
        from the graph -- ``backward()`` would then update nothing. Confirm
        ``log_prob`` returns a differentiable tensor for those model types.
        """
        weighted_info = self.weighted_models[model_id]
        model = weighted_info['model']
        reward_weight = weighted_info['reward_weight']
        punishment_weight = weighted_info['punishment_weight']

        # Fall back to self.device if the model has no trainable parameters.
        device = next(model.parameters()).device if any(p.requires_grad for p in model.parameters()) else self.device
        optimizer = torch.optim.Adam(model.parameters(), lr=kwargs.get('lr', 1e-4))
        epochs = kwargs.get('epochs', 100)

        # Signals are constants for the optimization: detach and pin to device once.
        reward_signals = torch.as_tensor(reward_signals, dtype=torch.float32, device=device).detach()
        punishment_signals = torch.as_tensor(punishment_signals, dtype=torch.float32, device=device).detach()

        for epoch in range(epochs):
            model.train()
            optimizer.zero_grad()

            if isinstance(model, (GaussianMixture, HiddenMarkov)):
                log_probs = model.log_prob(data)
                if not torch.is_tensor(log_probs):
                    log_probs = torch.as_tensor(log_probs, dtype=torch.float32, device=device)
            else:
                outputs = model(data)
                log_probs = outputs['hgmm_log_likelihood']  # expected shape (B,)

            # Collapse any extra dims to one score per sample.
            if log_probs.dim() > 1:
                log_probs = log_probs.view(log_probs.size(0), -1).mean(dim=1)
            log_probs = log_probs.to(device).type(torch.float32)

            N = log_probs.numel()
            def _broadcast_signal(sig):
                # Accept scalar, per-sample, or otherwise expandable signals.
                if sig.numel() == 1:
                    return sig.expand(N)
                if sig.numel() == N:
                    return sig.view(N)
                try:
                    return sig.expand(N)
                except Exception:
                    raise ValueError(f"Signal of length {sig.numel()} cannot be broadcast to {N} samples")

            r = _broadcast_signal(reward_signals)
            p = _broadcast_signal(punishment_signals)

            reward_loss = -torch.mean(log_probs * r) * reward_weight
            punishment_loss = torch.mean(log_probs * p) * punishment_weight
            total_loss = reward_loss + punishment_loss

            # Numerical safety valve: skip the step and shrink LR on NaN/inf loss.
            if not torch.isfinite(total_loss):
                print("Warning: non-finite total_loss detected; skipping update and reducing LR.")
                for g in optimizer.param_groups:
                    g['lr'] = max(1e-8, g['lr'] * 0.1)
                continue

            total_loss.backward()
            torch.nn.utils.clip_grad_norm_(model.parameters(), max_norm=5.0)
            optimizer.step()

            # Progress log ~5 times over the run.
            if epoch % max(1, epochs // 5) == 0:
                print(f"Epoch {epoch}: reward_loss={reward_loss.item():.6f}, punishment_loss={punishment_loss.item():.6f}")

    def predict_anomalies(self, data, model_id, threshold=0.95):
        """
        Predict anomalies using both baseline and weighted models.

        Args:
            data: Input sensor data
            model_id: Model identifier
            threshold: Anomaly detection threshold

        Returns:
            dict containing:
                - baseline_predictions: Anomaly predictions from baseline model
                - weighted_predictions: Anomaly predictions from weighted model
                - confidence_scores: Confidence scores for predictions

        NOTE(review): for 'gmm'/'hmm' the baseline stored by ``fit_and_add`` is
        an ``MMModel`` wrapper with no ``log_prob`` method visible in this file;
        also ``threshold`` is compared directly against log-probabilities (which
        are typically negative), so 0.95 flags nearly everything -- verify both.
        """
        data = torch.tensor(data, dtype=torch.float32).to(self.device)

        # A sample is flagged anomalous when its log-probability falls below threshold.
        baseline_model = self.models[model_id]
        baseline_log_probs = baseline_model.log_prob(data)
        baseline_predictions = (baseline_log_probs < threshold).cpu().numpy()

        weighted_model = self.weighted_models[model_id]['model']
        weighted_log_probs = weighted_model.log_prob(data)
        weighted_predictions = (weighted_log_probs < threshold).cpu().numpy()

        # Sigmoid squashes log-probs into (0, 1) as a rough confidence proxy.
        confidence_scores = {
            'baseline': torch.sigmoid(baseline_log_probs).cpu().numpy(),
            'weighted': torch.sigmoid(weighted_log_probs).cpu().numpy()
        }

        return {
            'baseline_predictions': baseline_predictions,
            'weighted_predictions': weighted_predictions,
            'confidence_scores': confidence_scores
        }

    def evaluate_models(self, test_data, test_labels, model_id):
        """
        Evaluate and compare baseline and weighted models.

        Args:
            test_data: Test sensor data
            test_labels: Ground truth labels (array-like of 0/1)
            model_id: Model identifier

        Returns:
            dict containing evaluation metrics for both models
            ('accuracy', 'precision', 'recall', 'f1_score', 'false_alarm_rate',
            keyed under 'baseline' and 'weighted')
        """
        predictions = self.predict_anomalies(test_data, model_id)

        def calculate_metrics(preds, labels):
            # Confusion-matrix counts (1 = anomaly/positive class).
            tp = np.sum((preds == 1) & (labels == 1))
            fp = np.sum((preds == 1) & (labels == 0))
            tn = np.sum((preds == 0) & (labels == 0))
            fn = np.sum((preds == 0) & (labels == 1))

            # Guard each ratio against zero denominators.
            accuracy = (tp + tn) / (tp + tn + fp + fn)
            precision = tp / (tp + fp) if (tp + fp) > 0 else 0
            recall = tp / (tp + fn) if (tp + fn) > 0 else 0
            f1 = 2 * (precision * recall) / (precision + recall) if (precision + recall) > 0 else 0

            return {
                'accuracy': accuracy,
                'precision': precision,
                'recall': recall,
                'f1_score': f1,
                'false_alarm_rate': fp / (fp + tn) if (fp + tn) > 0 else 0
            }

        baseline_metrics = calculate_metrics(predictions['baseline_predictions'], test_labels)
        weighted_metrics = calculate_metrics(predictions['weighted_predictions'], test_labels)

        return {
            'baseline': baseline_metrics,
            'weighted': weighted_metrics
        }
mmm.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6defbe66414e745bab36dde7cb0684e46f25969429daa5e66780c7fb21c173fd
3
+ size 5222802