Upload folder using huggingface_hub

Files changed (7) hide show

README.md ADDED Viewed

+# LFM2-Audio Arabic TTS
+## Loading
+```python
+from liquid_audio import LFM2AudioModel, LFM2AudioProcessor
+import torch
+# Load base model and processor
+processor = LFM2AudioProcessor.from_pretrained("LiquidAI/LFM2-Audio-1.5B")
+model = LFM2AudioModel.from_pretrained("LiquidAI/LFM2-Audio-1.5B").eval().cuda()
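+# Load the fine-tuned weights on top of the base model
+# (download pytorch_model.bin from this repository into the working directory first)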
+state_dict = torch.load("pytorch_model.bin")
+model.load_state_dict(state_dict)
+```
+Training: Stage 1 (Depthformer only), 10 epochs; audio loss: 0.058.

config.json ADDED Viewed

+{
+  "architectures": [
+    "Lfm2Model"
+  ],
+  "block_auto_adjust_ff_dim": true,
+  "block_dim": 2048,
+  "block_ff_dim": 12288,
+  "block_ffn_dim_multiplier": 1,
+  "block_mlp_init_scale": 1,
+  "block_multiple_of": 256,
+  "block_norm_eps": 1e-05,
+  "block_out_init_scale": 1,
+  "block_use_swiglu": true,
+  "block_use_xavier_init": true,
+  "bos_token_id": 1,
+  "conv_L_cache": 3,
+  "conv_bias": false,
+  "conv_dim": 2048,
+  "conv_dim_out": 2048,
+  "conv_use_xavier_init": true,
+  "dtype": "bfloat16",
+  "eos_token_id": 7,
+  "hidden_size": 2048,
+  "initializer_range": 0.02,
+  "intermediate_size": 12288,
+  "layer_types": [
+    "conv",
+    "conv",
+    "full_attention",
+    "conv",
+    "conv",
+    "full_attention",
+    "conv",
+    "conv",
+    "full_attention",
+    "conv",
+    "full_attention",
+    "conv",
+    "full_attention",
+    "conv",
+    "full_attention",
+    "conv"
+  ],
+  "max_position_embeddings": 128000,
+  "model_type": "lfm2",
+  "norm_eps": 1e-05,
+  "num_attention_heads": 32,
+  "num_heads": 32,
+  "num_hidden_layers": 16,
+  "num_key_value_heads": 8,
+  "pad_token_id": 0,
+  "rope_theta": 1000000,
+  "transformers_version": "4.57.3",
+  "use_cache": true,
+  "use_pos_enc": true,
+  "vocab_size": 65536
+}

lfm/config.json ADDED Viewed

+{
+  "architectures": [
+    "Lfm2Model"
+  ],
+  "block_auto_adjust_ff_dim": true,
+  "block_dim": 2048,
+  "block_ff_dim": 12288,
+  "block_ffn_dim_multiplier": 1,
+  "block_mlp_init_scale": 1,
+  "block_multiple_of": 256,
+  "block_norm_eps": 1e-05,
+  "block_out_init_scale": 1,
+  "block_use_swiglu": true,
+  "block_use_xavier_init": true,
+  "bos_token_id": 1,
+  "conv_L_cache": 3,
+  "conv_bias": false,
+  "conv_dim": 2048,
+  "conv_dim_out": 2048,
+  "conv_use_xavier_init": true,
+  "dtype": "bfloat16",
+  "eos_token_id": 7,
+  "hidden_size": 2048,
+  "initializer_range": 0.02,
+  "intermediate_size": 12288,
+  "layer_types": [
+    "conv",
+    "conv",
+    "full_attention",
+    "conv",
+    "conv",
+    "full_attention",
+    "conv",
+    "conv",
+    "full_attention",
+    "conv",
+    "full_attention",
+    "conv",
+    "full_attention",
+    "conv",
+    "full_attention",
+    "conv"
+  ],
+  "max_position_embeddings": 128000,
+  "model_type": "lfm2",
+  "norm_eps": 1e-05,
+  "num_attention_heads": 32,
+  "num_heads": 32,
+  "num_hidden_layers": 16,
+  "num_key_value_heads": 8,
+  "pad_token_id": 0,
+  "rope_theta": 1000000,
+  "transformers_version": "4.57.3",
+  "use_cache": true,
+  "use_pos_enc": true,
+  "vocab_size": 65536
+}

lfm/model.safetensors ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:84e0ba68a67d4d1ad2e4ec8eea771758b00992017e543cfe7d5cfcb60b648fe1
+size 2340697048

model.safetensors ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:84e0ba68a67d4d1ad2e4ec8eea771758b00992017e543cfe7d5cfcb60b648fe1
+size 2340697048

pytorch_model.bin ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:51d2fbbe61007e1bdec8960180e0da756a820bca22cea7cd2ad305dd1dfc78bd
+size 2907408335

training_state.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:d65906fe5294c57051eb3fc3649a8103fdc801a054994a41240cf9b4f376d76c
+size 404961569