{
"model_type": "wildnerve_tlm01",
"architectures": ["Wildnerve_tlm01"],
"SELECTED_MODEL": ["model_Custm.py", "model_PrTr.py"],
"MODEL_NAME": "Wildnerve-tlm01_Hybrid_Model",
"BASE_DATA_DIR": "data",
"FILE_FORMATS": ["csv", "json", "txt"],
"MAX_SEQ_LENGTH": 767,
"SIMILARITY_THRESHOLD": 0.85,
"DATASET_PATHS": {
"general": ["data/general.json"],
"programming_software_dev": ["data/programming_software_dev.json"],
"python": [
"data/python_mbpp.json",
"data/python_programming.json",
"data/python_transformer_model.json"
],
"rust": [
"data/rust_ai_language_model.json",
"data/rust_blockchain.json",
"data/rust_mbrp.json",
"data/rust_programming.json"
],
"solidity": ["data/solidity_programming.json"],
"computer": [
"data/computer_advanced_debugging.json",
"data/computer_agenticAI.json",
"data/computer_architecture.json",
"data/computer_cloud_security.json",
"data/computer_cloudCI-CD.json",
"data/computer_creativity.json",
"data/computer_crossplatform.json",
"data/computer_cybersecurity.json",
"data/computer_error_handling_examples.json",
"data/computer_gitInstruct.json"
],
"cpp": [
"data/cpp_ai_language_model.json",
"data/cpp_blockchain.json",
"data/cpp_mbcppp.json",
"data/cpp_programming.json"
],
"go": [
"data/golang_ai_language_model.json",
"data/golang_mbgp.json",
"data/golang_programming.json"
],
"java": [
"data/java_ai_language_model.json",
"data/java_blockchain.json",
"data/java_mbjp.json",
"data/java_programming.json",
"data/java_transformer_language_model.json"
],
"javascript": [
"data/javascript_chatbot.json",
"data/javascript_n_Typescript_backend.json",
"data/javascript_n_Typescript_frontend.json",
"data/javascript_n_Typescript_programming.json"
],
"mathematics": [
"data/mathematics.json",
"data/mathematics_training.json"
],
"nim": [
"data/nim_ai_language_model.json",
"data/nim_blockchain.json",
"data/nim_chatbot.json",
"data/nim_conversation.json",
"data/nim_mbnp.json",
"data/nim_programming.json"
],
"other_information": ["data/other_information.json"],
"physics": [
"data/physics_n_engineering.json",
"data/physics_n_engineering_applied.json",
"data/project_structure.json",
"data/python_chatbot_guide.json"
]
},
"LAZY_LOADING_ENABLED": true,
"MAX_INITIAL_SPECIALIZATIONS": 2,
"train_file_path": "data/computer_advanced_debugging.json",
"NUM_EPOCHS": 50,
"LEARNING_RATE": 0.0001,
"INPUT_SIZE": 768,
"OUTPUT_SIZE": 768,
"SPECIALIZATIONS": [
"python",
"rust",
"solidity",
"computer",
"cpp",
"go",
"java",
"javascript",
"mathematics",
"nim",
"other_information",
"physics"
],
"PREPROCESSING": {
"LOWERCASE": true,
"REMOVE_SPECIAL_CHARACTERS": true,
"REPLACE_MULTIPLE_SPACES": true
},
"STDP_CONFIG": {
"WEIGHT_THRESHOLD": 0.5,
"ACTIVATION_THRESHOLD": 0.2,
"USE_SNN": true,
"ALPHA": 0.1,
"BETA": 0.2,
"BASE_DIR": "checkpoints",
"SNN_FILENAME_FORMAT": "snn_model_{specialization}_{epoch}.pt",
"STDPLearningRate": 0.01,
"STDPMemDecay": 0.9,
"SpikeThreshold": 0.5,
"firing_rate": 10,
"MAX_SEQ_LENGTH": 2048,
"STDP_PRETRAIN_EPOCHS": 5,
"STDP_FINETUNE_EPOCHS": 3,
"BATCH_SIZE_PRETRAIN": 32,
"BATCH_SIZE_FINETUNE": 16,
"NUM_NEURONS": 1024,
"MAX_RATE": 100
},
"TRAINING_CONFIG": {
"PATIENCE": 3,
"DELTA": 0.001,
"VERBOSE": true,
"NUM_EPOCHS": 20,
"LEARNING_RATE": 0.0001,
"TRANSFORMER_LEARNING_RATE": 5e-5,
"TRANSFORMER_NUM_EPOCHS": 20
},
"CHECKPOINT_CONFIG": {
"PATH": "checkpoints",
"BASE_DIR": "checkpoints",
"TRANSFORMER_FILENAME_FORMAT": "transformer_model_{specialization}_{epoch}.pt",
"SNN_FILENAME_FORMAT": "snn_model_{specialization}_{epoch}.pt"
},
"GENERATION_CONFIG": {
"temperature": 0.7,
"top_p": 0.9,
"num_return_sequences": 1
},
"TOKENIZER_CONFIG": {
"MODEL_NAME": "gpt2",
"MAX_SEQ_LENGTH": 1024,
"POOLING_MODE": "last"
},
"DATA_LOADER_CONFIG": {
"BATCH_SIZE": 32,
"NUM_WORKERS": 0,
"SHUFFLE": true,
"INCLUDE_CRAWL": true
},
"ATTENTION_CONFIG": {
"WINDOW_SIZE": 256,
"STRIDE": 128,
"MEMORY_SIZE": 64,
"NUM_HEADS": 8,
"ATTENTION_DROPOUT": 0.1,
"ATTENTION_TYPES": {
"SLIDING": true,
"HIERARCHICAL": true,
"GLOBAL": true
},
"PROMPT_THRESHOLDS": {
"LENGTH_THRESHOLD": 500,
"COMPLEXITY_THRESHOLD": 0.7,
"PERPLEXITY_THRESHOLD": 50
},
"ATTENTION_WEIGHTS": {
"SHORT_COMPLEX": {
"SLIDING": 0.4,
"HIERARCHICAL": 0.6
},
"LONG_CONTEXT": {
"SLIDING": 0.3,
"HIERARCHICAL": 0.4,
"GLOBAL": 0.3
}
}
},
"TRANSFORMER_CONFIG": {
"TEST_MODE": false,
"LOGGING_LEVEL": "INFO",
"LOG_FILE": "logs/training.log",
"SAVE_CHECKPOINTS": true,
"BASE_DIR": "checkpoints",
"TRANSFORMER_FILENAME_FORMAT": "transformer_model_{specialization}_{epoch}.pt",
"MODEL_NAME": "gpt2",
"MAX_SEQ_LENGTH": 767,
"NUM_EPOCHS": 20,
"LEARNING_RATE": 5e-5,
"BATCH_SIZE": 32,
"EMBEDDING_DIM": 768,
"NUM_HEADS": 12,
"HIDDEN_DIM": 768,
"NUM_LAYERS": 12,
"DROPOUT": 0.1,
"specialization1": "cpp",
"specialization2": "java",
"specialization3": "go",
"specialization4": "javascript",
"specialization5": "nim",
"specialization6": "python",
"specialization7": "rust",
"specialization8": "solidity",
"specialization9": "computer",
"specialization10": "mathematics",
"specialization11": "physics",
"specialization12": "other_information",
"DATASET_PATH": "data/cpp_ai_language_model.json",
"OUTPUT_SIZE": 768,
"POOLING_MODE": "mean",
"VOCAB_SIZE": 50257,
"MAX_RATE": 100,
"MODE": "pretrained",
"MODE2": "custom",
"SHUFFLE": true,
"SIMILARITY_THRESHOLD": 0.85,
"USE_PRETRAINED_ENCODER": true,
"ATTENTION_MECHANISM": {
"TYPE": "hybrid",
"WINDOW_SIZE": 1024,
"STRIDE": 512,
"USE_MEMORY": true
}
},
"DUAL_ENCODER_CONFIG": {
"USE_PRETRAINED_ENCODER": true,
"USE_CUSTOM_ENCODER": true,
"DEBUG": false
},
"PROMPT_ANALYZER_CONFIG": {
"MODEL_NAME": "gpt2",
"DATASET_PATH": null,
"SPECIALIZATION": null,
"HIDDEN_DIM": 768,
"MAX_CACHE_SIZE": 10
},
"MODEL_PRIORITY": {
"PRIMARY": "model_Custm",
"SECONDARY": "model_PrTr",
"USE_PRETRAINED_FALLBACK": true
},
"MAX_ACTIVE_MODELS": 5,
"MODEL_IDLE_THRESHOLD": 600,
"MAX_MEMORY_USAGE": 0.8,
"TOP_K": 3,
"TOPIC_KEYWORDS": {
"programming": ["python", "java", "javascript", "typescript", "rust", "go", "golang",
"c++", "cpp", "c#", "ruby", "php", "perl", "swift", "kotlin", "scala",
"html", "css", "sql", "database", "code", "function", "class", "method",
"algorithm", "data structure", "api", "http", "rest", "graphql", "json"],
"computer_science": ["algorithm", "complexity", "big o", "data structure", "graph", "tree", "hash table",
"linked list", "stack", "queue", "heap", "binary search", "sorting", "recursion",
"dynamic programming", "greedy algorithm", "backtracking", "computational", "turing"],
"software_engineering": ["design pattern", "architecture", "solid principles", "agile", "scrum", "kanban",
"waterfall", "ci/cd", "continuous integration", "continuous deployment", "testing",
"unit test", "integration test", "e2e test", "test-driven", "tdd", "bdd"],
"web_development": ["frontend", "backend", "full-stack", "web app", "spa", "pwa", "responsive",
"mobile-first", "css framework", "react", "angular", "vue", "svelte", "next.js"]
}
}