Upload config.json

928a969 verified 10 months ago

8.38 kB

	{
		"model_type": "wildnerve_tlm01",
		"architectures": ["Wildnerve_tlm01"],
		"SELECTED_MODEL": ["model_Custm.py", "model_PrTr.py"],
		"MODEL_NAME": "Wildnerve-tlm01_Hybrid_Model",
		"BASE_DATA_DIR": "data",
		"FILE_FORMATS": ["csv", "json", "txt"],
		"MAX_SEQ_LENGTH": 767,
		"SIMILARITY_THRESHOLD": 0.85,
		"DATASET_PATHS": {
			"general": ["data/general.json"],
			"programming_software_dev": ["data/programming_software_dev.json"],
			"python": [
				"data/python_mbpp.json",
				"data/python_programming.json",
				"data/python_transformer_model.json"
			],
			"rust": [
				"data/rust_ai_language_model.json",
				"data/rust_blockchain.json",
				"data/rust_mbrp.json",
				"data/rust_programming.json"
			],
			"solidity": ["data/solidity_programming.json"],
			"computer": [
				"data/computer_advanced_debugging.json",
				"data/computer_agenticAI.json",
				"data/computer_architecture.json",
				"data/computer_cloud_security.json",
				"data/computer_cloudCI-CD.json",
				"data/computer_creativity.json",
				"data/computer_crossplatform.json",
				"data/computer_cybersecurity.json",
				"data/computer_error_handling_examples.json",
				"data/computer_gitInstruct.json"
			],
			"cpp": [
				"data/cpp_ai_language_model.json",
				"data/cpp_blockchain.json",
				"data/cpp_mbcppp.json",
				"data/cpp_programming.json"
			],
			"go": [
				"data/golang_ai_language_model.json",
				"data/golang_mbgp.json",
				"data/golang_programming.json"
			],
			"java": [
				"data/java_ai_language_model.json",
				"data/java_blockchain.json",
				"data/java_mbjp.json",
				"data/java_programming.json",
				"data/java_transformer_language_model.json"
			],
			"javascript": [
				"data/javascript_chatbot.json",
				"data/javascript_n_Typescript_backend.json",
				"data/javascript_n_Typescript_frontend.json",
				"data/javascript_n_Typescript_programming.json"
			],
			"mathematics": [
				"data/mathematics.json",
				"data/mathematics_training.json"
			],
			"nim": [
				"data/nim_ai_language_model.json",
				"data/nim_blockchain.json",
				"data/nim_chatbot.json",
				"data/nim_conversation.json",
				"data/nim_mbnp.json",
				"data/nim_programming.json"
			],
			"other_information": ["data/other_information.json"],
			"physics": [
				"data/physics_n_engineering.json",
				"data/physics_n_engineering_applied.json",
				"data/project_structure.json",
				"data/python_chatbot_guide.json"
			]
		},
		"LAZY_LOADING_ENABLED": true,
		"MAX_INITIAL_SPECIALIZATIONS": 2,
		"train_file_path": "data/computer_advanced_debugging.json",
		"NUM_EPOCHS": 50,
		"LEARNING_RATE": 0.0001,
		"INPUT_SIZE": 768,
		"OUTPUT_SIZE": 768,
		"SPECIALIZATIONS": [
			"python",
			"rust",
			"solidity",
			"computer",
			"cpp",
			"go",
			"java",
			"javascript",
			"mathematics",
			"nim",
			"other_information",
			"physics"
		],
		"PREPROCESSING": {
			"LOWERCASE": true,
			"REMOVE_SPECIAL_CHARACTERS": true,
			"REPLACE_MULTIPLE_SPACES": true
		},
		"STDP_CONFIG": {
			"WEIGHT_THRESHOLD": 0.5,
			"ACTIVATION_THRESHOLD": 0.2,
			"USE_SNN": true,
			"ALPHA": 0.1,
			"BETA": 0.2,
			"BASE_DIR": "checkpoints",
			"SNN_FILENAME_FORMAT": "snn_model_{specialization}_{epoch}.pt",
			"STDPLearningRate": 0.01,
			"STDPMemDecay": 0.9,
			"SpikeThreshold": 0.5,
			"firing_rate": 10,
			"MAX_SEQ_LENGTH": 2048,
			"STDP_PRETRAIN_EPOCHS": 5,
			"STDP_FINETUNE_EPOCHS": 3,
			"BATCH_SIZE_PRETRAIN": 32,
			"BATCH_SIZE_FINETUNE": 16,
			"NUM_NEURONS": 1024,
			"MAX_RATE": 100
		},
		"TRAINING_CONFIG": {
			"PATIENCE": 3,
			"DELTA": 0.001,
			"VERBOSE": true,
			"NUM_EPOCHS": 20,
			"LEARNING_RATE": 0.0001,
			"TRANSFORMER_LEARNING_RATE": 5e-5,
			"TRANSFORMER_NUM_EPOCHS": 20
		},
		"CHECKPOINT_CONFIG": {
			"PATH": "checkpoints",
			"BASE_DIR": "checkpoints",
			"TRANSFORMER_FILENAME_FORMAT": "transformer_model_{specialization}_{epoch}.pt",
			"SNN_FILENAME_FORMAT": "snn_model_{specialization}_{epoch}.pt"
		},
		"GENERATION_CONFIG": {
			"temperature": 0.7,
			"top_p": 0.9,
			"num_return_sequences": 1
		},
		"TOKENIZER_CONFIG": {
			"MODEL_NAME": "gpt2",
			"MAX_SEQ_LENGTH": 1024,
			"POOLING_MODE": "last"
		},
		"DATA_LOADER_CONFIG": {
			"BATCH_SIZE": 32,
			"NUM_WORKERS": 0,
			"SHUFFLE": true,
			"INCLUDE_CRAWL": true
		},
		"ATTENTION_CONFIG": {
			"WINDOW_SIZE": 256,
			"STRIDE": 128,
			"MEMORY_SIZE": 64,
			"NUM_HEADS": 8,
			"ATTENTION_DROPOUT": 0.1,
			"ATTENTION_TYPES": {
				"SLIDING": true,
				"HIERARCHICAL": true,
				"GLOBAL": true
			},
			"PROMPT_THRESHOLDS": {
				"LENGTH_THRESHOLD": 500,
				"COMPLEXITY_THRESHOLD": 0.7,
				"PERPLEXITY_THRESHOLD": 50
			},
			"ATTENTION_WEIGHTS": {
				"SHORT_COMPLEX": {
					"SLIDING": 0.4,
					"HIERARCHICAL": 0.6
				},
				"LONG_CONTEXT": {
					"SLIDING": 0.3,
					"HIERARCHICAL": 0.4,
					"GLOBAL": 0.3
				}
			}
		},
		"TRANSFORMER_CONFIG": {
			"TEST_MODE": false,
			"LOGGING_LEVEL": "INFO",
			"LOG_FILE": "logs/training.log",
			"SAVE_CHECKPOINTS": true,
			"BASE_DIR": "checkpoints",
			"TRANSFORMER_FILENAME_FORMAT": "transformer_model_{specialization}_{epoch}.pt",
			"MODEL_NAME": "gpt2",
			"MAX_SEQ_LENGTH": 767,
			"NUM_EPOCHS": 20,
			"LEARNING_RATE": 5e-5,
			"BATCH_SIZE": 32,
			"EMBEDDING_DIM": 768,
			"NUM_HEADS": 12,
			"HIDDEN_DIM": 768,
			"NUM_LAYERS": 12,
			"DROPOUT": 0.1,
			"specialization1": "cpp",
			"specialization2": "java",
			"specialization3": "go",
			"specialization4": "javascript",
			"specialization5": "nim",
			"specialization6": "python",
			"specialization7": "rust",
			"specialization8": "solidity",
			"specialization9": "computer",
			"specialization10": "mathematics",
			"specialization11": "physics",
			"specialization12": "other_information",
			"DATASET_PATH": "data/cpp_ai_language_model.json",
			"OUTPUT_SIZE": 768,
			"POOLING_MODE": "mean",
			"VOCAB_SIZE": 50257,
			"MAX_RATE": 100,
			"MODE": "pretrained",
			"MODE2": "custom",
			"SHUFFLE": true,
			"SIMILARITY_THRESHOLD": 0.85,
			"USE_PRETRAINED_ENCODER": true,
			"ATTENTION_MECHANISM": {
				"TYPE": "hybrid",
				"WINDOW_SIZE": 1024,
				"STRIDE": 512,
				"USE_MEMORY": true
			}
		},
		"DUAL_ENCODER_CONFIG": {
			"USE_PRETRAINED_ENCODER": true,
			"USE_CUSTOM_ENCODER": true,
			"DEBUG": false
		},
		"PROMPT_ANALYZER_CONFIG": {
			"MODEL_NAME": "gpt2",
			"DATASET_PATH": null,
			"SPECIALIZATION": null,
			"HIDDEN_DIM": 768,
			"MAX_CACHE_SIZE": 10
		},
		"MODEL_PRIORITY": {
			"PRIMARY": "model_Custm",
			"SECONDARY": "model_PrTr",
			"USE_PRETRAINED_FALLBACK": true
		},
		"MAX_ACTIVE_MODELS": 5,
		"MODEL_IDLE_THRESHOLD": 600,
		"MAX_MEMORY_USAGE": 0.8,
		"TOP_K": 3,
		"TOPIC_KEYWORDS": {
			"programming": [
				"python", "java", "javascript", "typescript", "rust", "go", "golang",
				"c++", "cpp", "c#", "ruby", "php", "perl", "swift", "kotlin", "scala",
				"html", "css", "sql", "database", "code", "function", "class", "method",
				"algorithm", "data structure", "api", "http", "rest", "graphql", "json"
			],
			"computer_science": [
				"algorithm", "complexity", "big o", "data structure", "graph", "tree", "hash table",
				"linked list", "stack", "queue", "heap", "binary search", "sorting", "recursion",
				"dynamic programming", "greedy algorithm", "backtracking", "computational", "turing"
			],
			"software_engineering": [
				"design pattern", "architecture", "solid principles", "agile", "scrum", "kanban",
				"waterfall", "ci/cd", "continuous integration", "continuous deployment", "testing",
				"unit test", "integration test", "e2e test", "test-driven", "tdd", "bdd"
			],
			"web_development": [
				"frontend", "backend", "full-stack", "web app", "spa", "pwa", "responsive",
				"mobile-first", "css framework", "react", "angular", "vue", "svelte", "next.js"
			]
		}
	}