{
  "model_type": "wildnerve_tlm01",
  "architectures": ["Wildnerve_tlm01"],
  "SELECTED_MODEL": ["model_Custm.py", "model_PrTr.py"],
  "MODEL_NAME": "Wildnerve-tlm01_Hybrid_Model",
  "BASE_DATA_DIR": "data",
  "FILE_FORMATS": ["csv", "json", "txt"],
  "MAX_SEQ_LENGTH": 767,
  "SIMILARITY_THRESHOLD": 0.85,
  "DATASET_PATHS": {
    "general": ["data/general.json"],
    "programming_software_dev": ["data/programming_software_dev.json"],
    "python": [
      "data/python_mbpp.json",
      "data/python_programming.json",
      "data/python_transformer_model.json"
    ],
    "rust": [
      "data/rust_ai_language_model.json",
      "data/rust_blockchain.json",
      "data/rust_mbrp.json",
      "data/rust_programming.json"
    ],
    "solidity": ["data/solidity_programming.json"],
    "computer": [
      "data/computer_advanced_debugging.json",
      "data/computer_agenticAI.json",
      "data/computer_architecture.json",
      "data/computer_cloud_security.json",
      "data/computer_cloudCI-CD.json",
      "data/computer_creativity.json",
      "data/computer_crossplatform.json",
      "data/computer_cybersecurity.json",
      "data/computer_error_handling_examples.json",
      "data/computer_gitInstruct.json"
    ],
    "cpp": [
      "data/cpp_ai_language_model.json",
      "data/cpp_blockchain.json",
      "data/cpp_mbcppp.json",
      "data/cpp_programming.json"
    ],
    "go": [
      "data/golang_ai_language_model.json",
      "data/golang_mbgp.json",
      "data/golang_programming.json"
    ],
    "java": [
      "data/java_ai_language_model.json",
      "data/java_blockchain.json",
      "data/java_mbjp.json",
      "data/java_programming.json",
      "data/java_transformer_language_model.json"
    ],
    "javascript": [
      "data/javascript_chatbot.json",
      "data/javascript_n_Typescript_backend.json",
      "data/javascript_n_Typescript_frontend.json",
      "data/javascript_n_Typescript_programming.json"
    ],
    "mathematics": [
      "data/mathematics.json",
      "data/mathematics_training.json"
    ],
    "nim": [
      "data/nim_ai_language_model.json",
      "data/nim_blockchain.json",
      "data/nim_chatbot.json",
      "data/nim_conversation.json",
      "data/nim_mbnp.json",
      "data/nim_programming.json"
    ],
    "other_information": ["data/other_information.json"],
    "physics": [
      "data/physics_n_engineering.json",
      "data/physics_n_engineering_applied.json",
      "data/project_structure.json",
      "data/python_chatbot_guide.json"
    ]
  },
  "LAZY_LOADING_ENABLED": true,
  "MAX_INITIAL_SPECIALIZATIONS": 2,
  "train_file_path": "data/computer_advanced_debugging.json",
  "NUM_EPOCHS": 50,
  "LEARNING_RATE": 0.0001,
  "INPUT_SIZE": 768,
  "OUTPUT_SIZE": 768,
  "SPECIALIZATIONS": [
    "python",
    "rust",
    "solidity",
    "computer",
    "cpp",
    "go",
    "java",
    "javascript",
    "mathematics",
    "nim",
    "other_information",
    "physics"
  ],
  "PREPROCESSING": {
    "LOWERCASE": true,
    "REMOVE_SPECIAL_CHARACTERS": true,
    "REPLACE_MULTIPLE_SPACES": true
  },
  "STDP_CONFIG": {
    "WEIGHT_THRESHOLD": 0.5,
    "ACTIVATION_THRESHOLD": 0.2,
    "USE_SNN": true,
    "ALPHA": 0.1,
    "BETA": 0.2,
    "BASE_DIR": "checkpoints",
    "SNN_FILENAME_FORMAT": "snn_model_{specialization}_{epoch}.pt",
    "STDPLearningRate": 0.01,
    "STDPMemDecay": 0.9,
    "SpikeThreshold": 0.5,
    "firing_rate": 10,
    "MAX_SEQ_LENGTH": 2048,
    "STDP_PRETRAIN_EPOCHS": 5,
    "STDP_FINETUNE_EPOCHS": 3,
    "BATCH_SIZE_PRETRAIN": 32,
    "BATCH_SIZE_FINETUNE": 16,
    "NUM_NEURONS": 1024,
    "MAX_RATE": 100
  },
  "TRAINING_CONFIG": {
    "PATIENCE": 3,
    "DELTA": 0.001,
    "VERBOSE": true,
    "NUM_EPOCHS": 20,
    "LEARNING_RATE": 0.0001,
    "TRANSFORMER_LEARNING_RATE": 5e-5,
    "TRANSFORMER_NUM_EPOCHS": 20
  },
  "CHECKPOINT_CONFIG": {
    "PATH": "checkpoints",
    "BASE_DIR": "checkpoints",
    "TRANSFORMER_FILENAME_FORMAT": "transformer_model_{specialization}_{epoch}.pt",
    "SNN_FILENAME_FORMAT": "snn_model_{specialization}_{epoch}.pt"
  },
  "GENERATION_CONFIG": {
    "temperature": 0.7,
    "top_p": 0.9,
    "num_return_sequences": 1
  },
  "TOKENIZER_CONFIG": {
    "MODEL_NAME": "gpt2",
    "MAX_SEQ_LENGTH": 1024,
    "POOLING_MODE": "last"
  },
  "DATA_LOADER_CONFIG": {
    "BATCH_SIZE": 32,
    "NUM_WORKERS": 0,
    "SHUFFLE": true,
    "INCLUDE_CRAWL": true
  },
  "ATTENTION_CONFIG": {
    "WINDOW_SIZE": 256,
    "STRIDE": 128,
    "MEMORY_SIZE": 64,
    "NUM_HEADS": 8,
    "ATTENTION_DROPOUT": 0.1,
    "ATTENTION_TYPES": {
      "SLIDING": true,
      "HIERARCHICAL": true,
      "GLOBAL": true
    },
    "PROMPT_THRESHOLDS": {
      "LENGTH_THRESHOLD": 500,
      "COMPLEXITY_THRESHOLD": 0.7,
      "PERPLEXITY_THRESHOLD": 50
    },
    "ATTENTION_WEIGHTS": {
      "SHORT_COMPLEX": {
        "SLIDING": 0.4,
        "HIERARCHICAL": 0.6
      },
      "LONG_CONTEXT": {
        "SLIDING": 0.3,
        "HIERARCHICAL": 0.4,
        "GLOBAL": 0.3
      }
    }
  },
  "TRANSFORMER_CONFIG": {
    "TEST_MODE": false,
    "LOGGING_LEVEL": "INFO",
    "LOG_FILE": "logs/training.log",
    "SAVE_CHECKPOINTS": true,
    "BASE_DIR": "checkpoints",
    "TRANSFORMER_FILENAME_FORMAT": "transformer_model_{specialization}_{epoch}.pt",
    "MODEL_NAME": "gpt2",
    "MAX_SEQ_LENGTH": 767,
    "NUM_EPOCHS": 20,
    "LEARNING_RATE": 5e-5,
    "BATCH_SIZE": 32,
    "EMBEDDING_DIM": 768,
    "NUM_HEADS": 12,
    "HIDDEN_DIM": 768,
    "NUM_LAYERS": 12,
    "DROPOUT": 0.1,
    "specialization1": "cpp",
    "specialization2": "java",
    "specialization3": "go",
    "specialization4": "javascript",
    "specialization5": "nim",
    "specialization6": "python",
    "specialization7": "rust",
    "specialization8": "solidity",
    "specialization9": "computer",
    "specialization10": "mathematics",
    "specialization11": "physics",
    "specialization12": "other_information",
    "DATASET_PATH": "data/cpp_ai_language_model.json",
    "OUTPUT_SIZE": 768,
    "POOLING_MODE": "mean",
    "VOCAB_SIZE": 50257,
    "MAX_RATE": 100,
    "MODE": "pretrained",
    "MODE2": "custom",
    "SHUFFLE": true,
    "SIMILARITY_THRESHOLD": 0.85,
    "USE_PRETRAINED_ENCODER": true,
    "ATTENTION_MECHANISM": {
      "TYPE": "hybrid",
      "WINDOW_SIZE": 1024,
      "STRIDE": 512,
      "USE_MEMORY": true
    }
  },
  "DUAL_ENCODER_CONFIG": {
    "USE_PRETRAINED_ENCODER": true,
    "USE_CUSTOM_ENCODER": true,
    "DEBUG": false
  },
  "PROMPT_ANALYZER_CONFIG": {
    "MODEL_NAME": "gpt2",
    "DATASET_PATH": null,
    "SPECIALIZATION": null,
    "HIDDEN_DIM": 768,
    "MAX_CACHE_SIZE": 10
  },
  "MODEL_PRIORITY": {
    "PRIMARY": "model_Custm",
    "SECONDARY": "model_PrTr",
    "USE_PRETRAINED_FALLBACK": true
  },
  "MAX_ACTIVE_MODELS": 5,
  "MODEL_IDLE_THRESHOLD": 600,
  "MAX_MEMORY_USAGE": 0.8,
  "TOP_K": 3,
  "TOPIC_KEYWORDS": {
    "programming": [
      "python",
      "java",
      "javascript",
      "typescript",
      "rust",
      "go",
      "golang",
      "c++",
      "cpp",
      "c#",
      "ruby",
      "php",
      "perl",
      "swift",
      "kotlin",
      "scala",
      "html",
      "css",
      "sql",
      "database",
      "code",
      "function",
      "class",
      "method",
      "algorithm",
      "data structure",
      "api",
      "http",
      "rest",
      "graphql",
      "json"
    ],
    "computer_science": [
      "algorithm",
      "complexity",
      "big o",
      "data structure",
      "graph",
      "tree",
      "hash table",
      "linked list",
      "stack",
      "queue",
      "heap",
      "binary search",
      "sorting",
      "recursion",
      "dynamic programming",
      "greedy algorithm",
      "backtracking",
      "computational",
      "turing"
    ],
    "software_engineering": [
      "design pattern",
      "architecture",
      "solid principles",
      "agile",
      "scrum",
      "kanban",
      "waterfall",
      "ci/cd",
      "continuous integration",
      "continuous deployment",
      "testing",
      "unit test",
      "integration test",
      "e2e test",
      "test-driven",
      "tdd",
      "bdd"
    ],
    "web_development": [
      "frontend",
      "backend",
      "full-stack",
      "web app",
      "spa",
      "pwa",
      "responsive",
      "mobile-first",
      "css framework",
      "react",
      "angular",
      "vue",
      "svelte",
      "next.js"
    ]
  }
}