Spaces:

yatinece
/

ai_docker

Sleeping

App Files Files Community

ai_docker / saveFullModel.py

yatinece

Add application file

4e78d70 2 months ago

raw

history blame contribute delete

7.43 kB

	import torch
	import torch.nn as nn
	from torchvision import models
	import os

	class AIDetectorModel(nn.Module):
	    """Classifier built on torchvision's RegNet-Y-16GF with a custom MLP head.

	    The backbone is frozen except for ``trunk_output.block4`` (when that
	    attribute exists), its ``avgpool`` is swapped for adaptive max pooling,
	    and its ``fc`` layer is replaced by a Linear/SiLU/Dropout stack ending in
	    a ``num_classes``-wide linear layer.

	    Args:
	        num_classes: Output width of the final linear layer.
	        dropout_prob: Dropout probability used after each hidden layer.
	        load_pretrained: When true, the backbone starts from the
	            ``IMAGENET1K_SWAG_E2E_V1`` weights; otherwise it is built with
	            ``weights=None``.
	    """

	    def __init__(self, num_classes=2, dropout_prob=0.3, load_pretrained=True):
	        super().__init__()

	        # Pick the weight set first so the backbone is constructed in one place.
	        chosen_weights = None
	        if load_pretrained:
	            print("📥 Loading RegNet with pre-trained weights...")
	            chosen_weights = models.RegNet_Y_16GF_Weights.IMAGENET1K_SWAG_E2E_V1
	        self.backbone = models.regnet_y_16gf(weights=chosen_weights)

	        # Freeze every backbone parameter ...
	        self.backbone.requires_grad_(False)

	        # ... then re-enable gradients for the last trunk block, if present.
	        trunk = getattr(self.backbone, 'trunk_output', None)
	        last_block = getattr(trunk, 'block4', None)
	        if last_block is not None:
	            last_block.requires_grad_(True)

	        # Global max pooling instead of the stock average pooling.
	        self.backbone.avgpool = nn.AdaptiveMaxPool2d(output_size=(1, 1))

	        # Build the replacement head: three hidden stages, then the output
	        # layer. Layers are created in the same order as a literal listing,
	        # so Sequential indices (and state-dict keys) are 0..9.
	        head_layers = []
	        in_width = self.backbone.fc.in_features
	        for out_width in (2048, 1024, 512):
	            head_layers.extend([
	                nn.Linear(in_width, out_width),
	                nn.SiLU(),
	                nn.Dropout(dropout_prob),
	            ])
	            in_width = out_width
	        head_layers.append(nn.Linear(in_width, num_classes))
	        self.backbone.fc = nn.Sequential(*head_layers)

	    def forward(self, x):
	        """Run ``x`` through the backbone (including the custom head)."""
	        return self.backbone(x)

	def verify_complete_backbone(model, *, min_block_keys=400, min_stem_keys=5, min_proj_keys=20):
	    """Report whether ``model``'s state dict looks like a full RegNet backbone.

	    The check is purely name-based: state-dict keys are bucketed by substring
	    and each bucket's size must be strictly greater than its lower bound.
	    A summary of the counts and the verdict is printed to stdout.

	    Args:
	        model: Any object whose ``state_dict()`` returns a mapping keyed by
	            parameter/buffer name.
	        min_block_keys: Strict lower bound on the number of keys containing
	            ``'backbone.trunk_output.block'``.
	        min_stem_keys: Strict lower bound on the number of keys containing
	            ``'backbone.stem'``.
	        min_proj_keys: Strict lower bound on the number of block keys that
	            also contain ``'proj'``.

	    The defaults are the thresholds the original author chose for
	    RegNet-Y-16GF (noted there as roughly 420 block keys, 24 projection keys
	    and 6 stem keys); pass other bounds to reuse the check elsewhere.

	    Returns:
	        bool: ``True`` when all three counts exceed their bounds.
	    """
	    all_keys = list(model.state_dict().keys())

	    # Bucket keys by the component they belong to.
	    stem_keys = [k for k in all_keys if 'backbone.stem' in k]
	    block_keys = [k for k in all_keys if 'backbone.trunk_output.block' in k]
	    # Projection keys are by definition a subset of the block keys.
	    proj_keys = [k for k in block_keys if 'proj' in k]
	    fc_keys = [k for k in all_keys if 'backbone.fc' in k]

	    print("🔍 Backbone verification:")
	    print(f" • Total keys: {len(all_keys)}")
	    print(f" • Stem keys: {len(stem_keys)}")
	    print(f" • Block keys: {len(block_keys)}")
	    print(f" • Projection keys: {len(proj_keys)}")
	    print(f" • FC keys: {len(fc_keys)}")

	    is_complete = (
	        len(block_keys) > min_block_keys
	        and len(stem_keys) > min_stem_keys
	        and len(proj_keys) > min_proj_keys
	    )

	    if is_complete:
	        print("✅ Complete backbone verified!")
	        print(f"✅ Found {len(block_keys)} blocks, {len(stem_keys)} stem, {len(proj_keys)} proj layers")
	    else:
	        print("❌ Incomplete backbone detected!")
	        # Derived from the parameters so the message always matches the check.
	        print(f"Expected: >{min_block_keys} blocks, >{min_stem_keys} stem, >{min_proj_keys} proj")
	        print(f"Found: {len(block_keys)} blocks, {len(stem_keys)} stem, {len(proj_keys)} proj")

	    return is_complete

	def create_truly_complete_model(trained_checkpoint_path, output_path):
	    """Merge a trained classifier head into a pretrained RegNet and save it.

	    A fresh ``AIDetectorModel`` with pretrained backbone weights is created,
	    every ``backbone.fc`` tensor in its state dict is overwritten with the
	    tensor of the same name from the trained checkpoint, the merged state is
	    loaded into an empty architecture as a sanity check, and the result is
	    written to ``output_path`` together with a few metadata fields.

	    Args:
	        trained_checkpoint_path: Path of the trained checkpoint. It may be a
	            raw state dict, or a dict holding the state dict under
	            ``'model_state_dict'`` (optionally with ``num_classes``,
	            ``dropout_prob``, ``epoch`` and ``val_loss``).
	        output_path: Destination file for ``torch.save``.

	    Returns:
	        ``output_path``, unchanged.

	    Raises:
	        RuntimeError: If the fresh or the final model fails
	            ``verify_complete_backbone``, or if the checkpoint does not
	            provide every ``backbone.fc`` tensor of the architecture.
	    """
	    print("🔄 Creating TRULY complete offline model...")
	    print("=" * 60)

	    # Step 1: fresh model WITH pretrained weights (source of backbone tensors).
	    print("📥 Step 1: Loading fresh RegNet with ImageNet weights...")
	    fresh_model = AIDetectorModel(load_pretrained=True)

	    # Step 2: make sure the pretrained backbone really is all there.
	    print("\n🔍 Step 2: Verifying fresh model completeness...")
	    if not verify_complete_backbone(fresh_model):
	        raise RuntimeError("❌ Fresh model is not complete!")

	    # Step 3: load the trained checkpoint.
	    print(f"\n📂 Step 3: Loading your trained weights from {trained_checkpoint_path}...")
	    # SECURITY: torch.load is pickle-based; only use it on checkpoints from a
	    # trusted source (see the `weights_only` option in the torch.load docs).
	    trained_checkpoint = torch.load(trained_checkpoint_path, map_location='cpu')

	    if isinstance(trained_checkpoint, dict) and 'model_state_dict' in trained_checkpoint:
	        trained_state = trained_checkpoint['model_state_dict']
	        extra_info = {
	            'num_classes': trained_checkpoint.get('num_classes', 2),
	            'dropout_prob': trained_checkpoint.get('dropout_prob', 0.3),
	            'epoch': trained_checkpoint.get('epoch', 0),
	            'val_loss': trained_checkpoint.get('val_loss', 0.0),
	        }
	    else:
	        # Bare state dict: no metadata available, fall back to the defaults.
	        trained_state = trained_checkpoint
	        extra_info = {'num_classes': 2, 'dropout_prob': 0.3}

	    # Step 4: backbone from the fresh model, classifier from the checkpoint.
	    print("\n🔀 Step 4: Merging backbone + trained classifier...")
	    fresh_state = fresh_model.state_dict()
	    merged_state = fresh_state.copy()

	    # NOTE(review): AIDetectorModel leaves trunk_output.block4 trainable, but
	    # only `backbone.fc` tensors are taken from the checkpoint here. If block4
	    # was fine-tuned, those weights are not carried over — confirm intended.

	    # Drive the merge from the architecture's own head keys so that (a) every
	    # head tensor is guaranteed to come from the checkpoint rather than from
	    # random initialisation, and (b) stray checkpoint keys (e.g. carrying a
	    # wrapper prefix) are never injected into the merged state.
	    classifier_keys = [k for k in fresh_state if 'backbone.fc' in k]
	    missing_keys = [k for k in classifier_keys if k not in trained_state]
	    if missing_keys:
	        raise RuntimeError(
	            "❌ Trained checkpoint is missing classifier weights: "
	            f"{missing_keys}. Check that its keys match the AIDetectorModel "
	            "layout (no extra prefix such as 'module.')."
	        )

	    print(f" • Replacing {len(classifier_keys)} classifier parameters")
	    for key in classifier_keys:
	        merged_state[key] = trained_state[key]
	        print(f" ✅ Updated: {key}")

	    # Step 5: load into an empty architecture. Use the checkpoint's own
	    # hyper-parameters so a head trained with a non-default class count
	    # loads instead of failing with a size mismatch.
	    print("\n✅ Step 5: Creating final complete model...")
	    final_model = AIDetectorModel(
	        num_classes=extra_info['num_classes'],
	        dropout_prob=extra_info['dropout_prob'],
	        load_pretrained=False,
	    )
	    final_model.load_state_dict(merged_state)

	    print("\n🔍 Final verification:")
	    if not verify_complete_backbone(final_model):
	        raise RuntimeError("❌ Final model verification failed!")

	    # Step 6: persist the merged weights plus metadata.
	    print(f"\n💾 Step 6: Saving complete model to {output_path}...")
	    complete_checkpoint = {
	        'model_state_dict': merged_state,
	        'complete_model': True,
	        'backbone_included': True,
	        'offline_ready': True,
	        **extra_info,
	    }

	    torch.save(complete_checkpoint, output_path)

	    file_size = os.path.getsize(output_path) / (1024*1024)
	    print("✅ SUCCESS! Complete model saved:")
	    print(f" • File: {output_path}")
	    print(f" • Size: {file_size:.1f}MB")
	    print(" • Ready for offline use!")

	    return output_path

	if __name__ == "__main__":
	    # Trained checkpoint to read and the merged checkpoint to write.
	    input_model = "2_block_best_ai_detector.pth"
	    output_model = "truly_complete_ai_detector_new.pth"

	    if os.path.exists(input_model):
	        banner = "="*60
	        try:
	            result_path = create_truly_complete_model(input_model, output_model)
	            print("\n" + banner)
	            print("🎉 SUCCESS! Use this file in your offline app:")
	            print(f"📁 {result_path}")
	            print(banner)
	        except Exception as err:
	            # Top-level boundary: report the failure instead of a traceback.
	            print(f"❌ Failed to create complete model: {err}")
	    else:
	        print(f"❌ Trained model not found: {input_model}")
	        # Help the user by listing candidate checkpoints in the working dir.
	        candidates = [entry for entry in os.listdir('.') if entry.endswith('.pth')]
	        if not candidates:
	            print("No .pth files found in current directory")
	        else:
	            print("Available .pth files:")
	            for candidate in candidates:
	                size_mb = os.path.getsize(candidate) / (1024*1024)
	                print(f" • {candidate} ({size_mb:.1f}MB)")