Delete config.json

Files changed (1) hide show

config.json DELETED Viewed

@@ -1,50 +0,0 @@
-{
-  "model_name": "Xoron-Dev-MultiMoE",
-  "hidden_size": 1024,
-  "num_layers": 12,
-  "num_heads": 16,
-  "intermediate_size": 2048,
-  "vocab_size": 151643,
-  "max_position_embeddings": 131072,
-  "use_sliding_window": true,
-  "sliding_window": 4096,
-  "use_moe": true,
-  "num_experts": 8,
-  "num_experts_per_tok": 2,
-  "moe_layer_freq": 2,
-  "router_aux_loss_coef": 0.1,
-  "vision_model_name": "openai/clip-vit-base-patch16",
-  "freeze_vision": false,
-  "num_vision_tokens": 64,
-  "max_video_frames": 32,
-  "enable_generation": true,
-  "generation_image_size": 256,
-  "generation_video_size": 256,
-  "generation_latent_channels": 4,
-  "generation_base_channels": 128,
-  "generation_inference_steps": 8,
-  "tokenizer_name": "Qwen/Qwen2.5-1.5B",
-  "use_lora": true,
-  "lora_r": 32,
-  "lora_alpha": 64,
-  "lora_dropout": 0.05,
-  "lora_target_modules": [
-    "q_proj",
-    "k_proj",
-    "v_proj",
-    "o_proj",
-    "gate_proj",
-    "up_proj",
-    "down_proj"
-  ],
-  "train_lora_only": false,
-  "use_cross_attention": true,
-  "cross_attention_layers": 4,
-  "cross_attention_heads": 8,
-  "cross_attention_dropout": 0.1,
-  "use_flash_attention": true,
-  "output_dir": "./xoron-model",
-  "has_audio_encoder": true,
-  "has_audio_decoder": true,
-  "lora_applied": true
-}