"""
Inference code for the Code Analyzer model.

This file enables the "Use this model" button on Hugging Face.
"""
|
|
|
| from transformers import AutoModelForCausalLM, AutoTokenizer
|
| import torch
|
|
|
|
|
def load_model_and_tokenizer(model_name: str):
    """Load the causal LM and its tokenizer from the Hugging Face Hub.

    Picks bfloat16 when a CUDA device is available (float32 otherwise) and
    lets ``device_map="auto"`` decide weight placement.

    Args:
        model_name: Hub repo id or local path of the model.

    Returns:
        A ``(model, tokenizer)`` tuple.
    """
    # Choose the compute dtype once, up front, instead of inline in the call.
    dtype = torch.bfloat16 if torch.cuda.is_available() else torch.float32

    tokenizer = AutoTokenizer.from_pretrained(model_name, trust_remote_code=True)
    model = AutoModelForCausalLM.from_pretrained(
        model_name,
        torch_dtype=dtype,
        device_map="auto",
        trust_remote_code=True,
    )
    return model, tokenizer
|
|
|
|
|
def build_input(task, code):
    """Assemble the prompt text in the exact format used during training.

    A "Задача:" (task) section and a "Решение (код):" (solution code) section
    are emitted only when their text is non-empty after stripping; sections
    are separated by a blank line.

    Args:
        task: the task statement (may be empty/whitespace).
        code: the student's solution code (may be empty/whitespace).

    Returns:
        The joined prompt string ("" when both inputs are blank).
    """
    task_text = task.strip()
    code_text = code.strip()

    sections = []
    if task_text:
        sections.append(f"Задача:\n{task_text}")
    if code_text:
        sections.append(f"Решение (код):\n```python\n{code_text}\n```")
    return "\n\n".join(sections)
|
|
|
|
|
def generate_response(
    model,
    tokenizer,
    task: str,
    code: str,
    max_new_tokens: int = 1024,
    temperature: float = 0.7,
    top_p: float = 0.8,
    top_k: int = 20,
    repetition_penalty: float = 1.05,
):
    """Generate the model's analysis for a task and a student's code.

    Builds the training-format prompt via ``build_input``, appends the
    "Ответ:" answer marker, samples a continuation, and returns only the
    generated answer text.

    Args:
        model: loaded causal LM (see ``load_model_and_tokenizer``).
        tokenizer: the tokenizer matching ``model``.
        task: the task statement (may be empty).
        code: the student's solution code (may be empty).
        max_new_tokens: generation length cap.
        temperature, top_p, top_k, repetition_penalty: sampling parameters
            forwarded to ``model.generate``.

    Returns:
        The generated answer string, stripped, without the prompt.
    """
    input_text = build_input(task, code)
    prompt = f"{input_text}\n\nОтвет:\n"

    inputs = tokenizer(prompt, return_tensors="pt").to(model.device)
    prompt_len = inputs["input_ids"].shape[1]

    with torch.no_grad():
        outputs = model.generate(
            **inputs,
            max_new_tokens=max_new_tokens,
            temperature=temperature,
            top_p=top_p,
            top_k=top_k,
            repetition_penalty=repetition_penalty,
            do_sample=True,
            pad_token_id=tokenizer.eos_token_id,
        )

    # Decode only the newly generated tokens instead of decoding the whole
    # sequence and splitting on "Ответ:". The string-split approach broke
    # whenever the model emitted "Ответ:" again inside its answer (everything
    # before the *last* occurrence was discarded).
    generated_ids = outputs[0][prompt_len:]
    response = tokenizer.decode(generated_ids, skip_special_tokens=True)

    return response.strip()
|
|
|
|
|
def _demo() -> None:
    """Run a small end-to-end demo: load the model and analyse one solution."""
    import json

    model_name = "Vilyam888/Code_analyze.1.0"

    print("Loading model...")
    model, tokenizer = load_model_and_tokenizer(model_name)

    task = "Напишите функцию, которая принимает список чисел и возвращает сумму всех элементов."
    code = """def sum_list(numbers):
    total = 0
    for num in numbers:
        total += num
    return total"""

    print(f"\nЗадача: {task}")
    print(f"\nКод студента:\n{code}\n")
    print("Generating analysis...")

    response = generate_response(model, tokenizer, task, code)

    # The model is trained to answer in JSON; pretty-print it when parseable,
    # otherwise fall back to printing the raw text.
    try:
        result = json.loads(response)
        print("\nРезультат анализа (JSON):")
        print(json.dumps(result, ensure_ascii=False, indent=2))
    except json.JSONDecodeError:
        print(f"\nРезультат анализа:\n{response}")


if __name__ == "__main__":
    _demo()