mycholpath
/

RA-Mistral-7B

Text Generation

Model card Files Files and versions

RA-Mistral-7B / fix_interference_api.py

mycholpath's picture

Upload folder using huggingface_hub

f480253 verified 11 months ago

history blame contribute delete

2.6 kB

	import os
	import json
	import yaml
	import torch
	from transformers import AutoTokenizer, AutoModelForCausalLM
	import logging
	import time

	# Add more detailed logging
	logging.basicConfig(level=logging.INFO)
	logger = logging.getLogger(__name__)

	def test_model_loading(base_model='mistralai/Mistral-7B-Instruct-v0.3', timeout=600):
	try:
	start_time = time.time()

	# Log more details about download process
	logger.info(f"Attempting to load tokenizer from {base_model}")
	tokenizer = AutoTokenizer.from_pretrained(
	base_model,
	# Add cache directory explicitly
	cache_dir='./model_cache',
	# Add timeout parameters
	use_auth_token=False,
	local_files_only=False,
	resume_download=True
	)

	logger.info(f"Tokenizer loaded. Setting pad token if needed.")
	if tokenizer.pad_token is None:
	tokenizer.pad_token = tokenizer.eos_token

	# Log model loading with more parameters
	logger.info(f"Loading model with extended timeout handling")
	model = AutoModelForCausalLM.from_pretrained(
	base_model,
	cache_dir='./model_cache',
	use_auth_token=False,
	local_files_only=False,
	resume_download=True,
	# Optional: Force download if needed
	force_download=False,
	# Optional: Use torch compile for potential performance
	torch_dtype=torch.float16 if torch.cuda.is_available() else torch.float32
	)

	# Rest of the generation code remains the same
	input_text = "Hello, how are you today?"
	inputs = tokenizer(
	input_text,
	return_tensors="pt",
	padding=True,
	add_special_tokens=True,
	return_attention_mask=True
	)

	with torch.no_grad():
	output = model.generate(
	input_ids=inputs['input_ids'],
	attention_mask=inputs['attention_mask'],
	max_length=20,
	num_return_sequences=1,
	do_sample=False
	)

	generated_text = tokenizer.decode(output[0], skip_special_tokens=True)
	logger.info(f"Generation successful: {generated_text}")

	return True

	except Exception as e:
	logger.error(f"Detailed error during model loading: {e}")
	import traceback
	traceback.print_exc()
	return False

	if __name__ == '__main__':
	test_model_loading()