{
  "model_name": "ai-coder-v1",
  "model_type": "llama",
  "vocab_size": 10000,
  "n_positions": 2048,
  "n_ctx": 2048,
  "n_embd": 512,
  "n_layer": 6,
  "n_head": 8,
  "n_kv_head": 4,
  "rotary_dim": 64,
  "activation_function": "swiglu",
  "layer_norm_epsilon": 1e-05,
  "initializer_range": 0.02,
  "use_cache": true,
  "rope_scaling": {
    "type": "dynamic",
    "factor": 2.0
  },
  "sliding_window": 1024,
  "attention_config": {
    "type": "multi_query",
    "head_dim": 64,
    "kv_heads": 4,
    "sliding_window": 1024,
    "attention_dropout": 0.1
  },
  "architectures": [
    "LlamaForCausalLM"
  ],
  "tokenizer_class": "CodeTokenizer",
  "tie_word_embeddings": true,
  "torch_dtype": "bfloat16",
  "transformers_version": "4.37.0",
  "flash_attention": false,
  "gradient_checkpointing": false,
  "use_memory_efficient_attention": false,
  "parallel_attention": false,
  "learning_config": {
    "online_learning": {
      "enabled": false,
      "learning_rate": 0.0001,
      "batch_size": 16,
      "max_steps": 100,
      "warmup_steps": 10
    },
    "meta_learning": {
      "enabled": false,
      "inner_learning_rate": 0.001,
      "outer_learning_rate": 0.0001,
      "num_inner_steps": 3,
      "num_outer_steps": 10
    },
    "active_learning": {
      "enabled": true,
      "uncertainty_threshold": 0.8,
      "max_queries_per_session": 5,
      "min_confidence_score": 0.6
    },
    "knowledge_distillation": {
      "enabled": true,
      "temperature": 2.0,
      "alpha": 0.5,
      "teacher_models": [
        "gpt-4",
        "claude-3"
      ]
    },
    "feedback_learning": {
      "enabled": true,
      "feedback_buffer_size": 1000,
      "min_feedback_samples": 50,
      "update_interval": 100
    },
    "optimization": {
      "optimizer": "adamw",
      "weight_decay": 0.01,
      "learning_rate_scheduler": "cosine",
      "warmup_ratio": 0.1,
      "gradient_clip_val": 1.0
    }
  },
  "advanced_features": {
    "code_completion": true,
    "type_inference": true,
    "semantic_analysis": true,
    "refactoring": true,
    "bug_detection": true,
    "security_analysis": true,
    "performance_optimization": true,
    "style_checking": true,
    "documentation_generation": true,
    "test_generation": true,
    "multi_language_support": true,
    "framework_detection": true
  }
}