PredictiveManish
/

Trimurti-LM

{
	"model_id": "trimurti-lm",
	"model_name": "Trimurti-LM",
	"model_type": "language_model",
	"architecture": "GPT2",
	"framework": "transformers",
	"languages": {
		"supported": ["en", "hi", "pa"],
		"language_tags": ["[EN]", "[HI]", "[PA]"],
		"description": "Trilingual language model supporting English, Hindi, and Punjabi"
	},
	"model_config": {
		"vocab_size": 8000,
		"n_positions": 128,
		"n_embd": 256,
		"n_layer": 4,
		"n_head": 4,
		"n_inner": 512,
		"activation_function": "gelu_new",
		"attn_pdrop": 0.1,
		"embd_pdrop": 0.1,
		"resid_pdrop": 0.1,
		"estimated_parameters": "4.7M"
	},
	"tokenizer": {
		"type": "sentencepiece",
		"model_type": "unigram",
		"vocab_size": 8000,
		"character_coverage": 0.9995,
		"byte_fallback": true,
		"model_path": "final_corpus/multilingual_spm.model"
	},
	"training": {
		"corpus": "final_corpus/multilingual_corpus_train.txt",
		"validation": "final_corpus/multilingual_corpus_val.txt",
		"total_steps": 5000,
		"batch_size": 2,
		"gradient_accumulation": 8,
		"learning_rate": 2e-4,
		"warmup_steps": 1000,
		"effective_batch_size": 16
	},
	"checkpoints": {
		"path": "checkpoints_tiny",
		"available_checkpoints": [
			"step1000",
			"step2000",
			"step3000",
			"step4000",
			"step5000",
			"final"
		]
	},
	"evaluation": {
		"overall_accuracy": 100.0,
		"english_accuracy": 100.0,
		"hindi_accuracy": 100.0,
		"punjabi_accuracy": 100.0,
		"mixed_accuracy": 100.0,
		"avg_english_perplexity": 42.29,
		"avg_hindi_perplexity": 50.56,
		"avg_punjabi_perplexity": 63.42
	},
	"entry_points": {
		"training": "python train_model.py",
		"testing": "python test_model.py",
		"evaluation": "python evaluate_model.py",
		"preprocessing": "python preprocess.py",
		"web_interface": "python web_interface.py"
	},
	"dependencies": [
		"torch",
		"transformers",
		"sentencepiece",
		"tqdm",
		"gradio",
		"pandas",
		"numpy"
	],
	"filter": [
		{
			"bool": {
				"should": [
					{
						"term": { "path": "model_index.json" }
					},
					{
						"regexp": { "path": "[^/]*\\.safetensors" }
					},
					{
						"regexp": { "path": "[^/]*\\.ckpt" }
					},
					{
						"regexp": { "path": "[^/]*\\.bin" }
					}
				],
				"minimum_should_match": 1
			}
		}
	],
	"files": [
		{
			"path": "checkpoints_tiny/final/model.safetensors",
			"description": "Final trained model weights"
		},
		{
			"path": "checkpoints_tiny/final/config.json",
			"description": "Model configuration"
		},
		{
			"path": "checkpoints_tiny/final/generation_config.json",
			"description": "Generation settings"
		},
		{
			"path": "final_corpus/multilingual_spm.model",
			"description": "SentencePiece tokenizer model"
		},
		{
			"path": "final_corpus/multilingual_spm.vocab",
			"description": "Tokenizer vocabulary"
		},
		{
			"path": "train_model.py",
			"description": "Training script"
		},
		{
			"path": "test_model.py",
			"description": "Testing and inference script"
		},
		{
			"path": "evaluate_model.py",
			"description": "Evaluation script"
		},
		{
			"path": "preprocess.py",
			"description": "Data preprocessing script"
		},
		{
			"path": "web_interface.py",
			"description": "Gradio web interface"
		}
	]
}