Spaces:

SallySims
/

AnthroBot

Sleeping

App Files Files Community

AnthroBot / app.py

SallySims

Update app.py

6bc2197 verified 9 months ago

raw

history blame contribute delete

7.69 kB

	## AnthroBot Streamlit app, deployed on Hugging Face Spaces

	import streamlit as st
	import pandas as pd
	import torch
	import os
	from huggingface_hub import login
	from transformers import AutoTokenizer, AutoModelForCausalLM, TextStreamer
	from peft import PeftModel, PeftConfig
	import io
	from transformers.tokenization_utils_base import BatchEncoding

	# Configure the page before anything else: Streamlit expects set_page_config
	# to be the first Streamlit command run on a page, and the error paths below
	# render elements.
	st.set_page_config(page_title="AnthroBot", page_icon="🤖", layout="centered")

	# Authenticate with the Hugging Face Hub using the token from the environment.
	hf_token = os.getenv("HUGGINGFACEHUB_TOKEN")
	if not hf_token:
	    # login(token=None) falls back to an interactive prompt, which nobody can
	    # answer from a hosted app, so fail fast with an explicit message instead.
	    st.error("Error logging in to Hugging Face: HUGGINGFACEHUB_TOKEN is not set")
	    st.stop()

	try:
	    login(token=hf_token)
	except Exception as e:
	    # Top-level boundary: report the failure on the page and halt this run.
	    st.error(f"Error logging in to Hugging Face: {str(e)}")
	    st.stop()

	# Load model & tokenizer
	@st.cache_resource
	def load_model():
	    """Load the LoRA-adapted causal language model and its tokenizer.

	    The adapter config at ``SallySims/AnthroBot_Model_Lora`` names the base
	    model. The base model is loaded in float16 with ``device_map="auto"``,
	    wrapped with the adapter weights, and switched to eval mode. The
	    tokenizer comes from the same base model and reuses EOS as its pad token.

	    Returns:
	        A ``(model, tokenizer)`` tuple.

	    Raises:
	        Exception: any loading failure is shown with ``st.error`` and then
	            re-raised unchanged.
	    """
	    adapter_repo = "SallySims/AnthroBot_Model_Lora"
	    try:
	        adapter_cfg = PeftConfig.from_pretrained(adapter_repo)

	        backbone = AutoModelForCausalLM.from_pretrained(
	            adapter_cfg.base_model_name_or_path,
	            torch_dtype=torch.float16,
	            device_map="auto",
	            trust_remote_code=True,
	            token=True,
	        )
	        adapted = PeftModel.from_pretrained(backbone, adapter_repo)
	        adapted.eval()

	        tok = AutoTokenizer.from_pretrained(
	            adapter_cfg.base_model_name_or_path,
	            trust_remote_code=True,
	            token=True,
	        )
	        # Reuse EOS for padding (the original author notes the id as 128001).
	        tok.pad_token = tok.eos_token
	        tok.pad_token_id = tok.eos_token_id

	        st.write("✅ Model and tokenizer loaded successfully.")
	        return adapted, tok
	    except Exception as e:
	        st.error(f"Error loading model: {str(e)}")
	        raise

	# Obtain the model and tokenizer (load_model is wrapped in st.cache_resource).
	model, tokenizer = load_model()

	# Make sure the per-session prediction history list exists.
	if "history" not in st.session_state:
	    st.session_state["history"] = []

	# Device that input tensors are moved to before generation.
	if torch.cuda.is_available():
	    device = "cuda"
	else:
	    device = "cpu"

	def _tokenize_prompt(prompt):
	    """Tokenize *prompt* via the chat template, falling back to plain tokenization."""
	    messages = [{"role": "user", "content": prompt}]
	    try:
	        return tokenizer.apply_chat_template(
	            messages,
	            tokenize=True,
	            add_generation_prompt=True,
	            return_tensors="pt",
	            max_length=512,
	            truncation=True,
	            return_dict=True,
	        )
	    except Exception as e:
	        st.warning(f"apply_chat_template failed: {str(e)}. Falling back to manual tokenization.")
	        return tokenizer(
	            prompt,
	            return_tensors="pt",
	            max_length=512,
	            truncation=True,
	            padding=False,
	            return_attention_mask=True,
	        )


	def _as_batch_of_one(input_ids, attention_mask):
	    """Reshape both tensors so a 1-D or over-nested input becomes 2-D."""
	    if input_ids.dim() > 2:
	        input_ids = input_ids.squeeze()
	        attention_mask = attention_mask.squeeze()
	    if input_ids.dim() == 1:
	        input_ids = input_ids.unsqueeze(0)
	        attention_mask = attention_mask.unsqueeze(0)
	    return input_ids, attention_mask


	def generate_response(age, sex, height_cm, weight_kg, wc_cm):
	    """Ask the model for a summary of one person's measurements.

	    Builds a one-line prompt from the arguments, tokenizes it, samples up to
	    250 new tokens, and records ``(prompt, response)`` in
	    ``st.session_state.history``. Debug information about the inputs is
	    written to the page along the way.

	    Args:
	        age: Age value interpolated into the prompt.
	        sex: Sex label interpolated into the prompt.
	        height_cm: Height in centimetres.
	        weight_kg: Weight in kilograms.
	        wc_cm: Waist circumference in centimetres.

	    Returns:
	        The generated text only, with the prompt and special tokens removed
	        (this may be an empty string), or ``None`` if the tokenizer output
	        has an unexpected type or any exception occurs. Failures are reported
	        with ``st.error`` and never raised.
	    """
	    try:
	        prompt = f"Age: {age}, Sex: {sex}, Height: {height_cm} cm, Weight: {weight_kg} kg, WC: {wc_cm} cm"
	        st.write(f"📝 Prompt Sent to Model: `{prompt}`")

	        inputs = _tokenize_prompt(prompt)

	        # Debug: log the structure of the tokenizer output.
	        is_mapping = isinstance(inputs, (dict, BatchEncoding))
	        st.write(f"Inputs type: {type(inputs)}")
	        st.write(f"Inputs keys: {list(inputs.keys()) if is_mapping else 'N/A'}")

	        # The tokenizer may return a mapping or a bare tensor of ids.
	        if is_mapping:
	            input_ids = inputs['input_ids']
	            attention_mask = inputs.get('attention_mask', torch.ones_like(input_ids))
	        elif isinstance(inputs, torch.Tensor):
	            input_ids = inputs
	            attention_mask = torch.ones_like(input_ids)
	        else:
	            st.error(f"Unexpected inputs format: {type(inputs)}")
	            return None

	        input_ids, attention_mask = _as_batch_of_one(input_ids, attention_mask)
	        st.write(f"Input IDs shape: {input_ids.shape}")
	        st.write(f"Attention mask shape: {attention_mask.shape}")

	        input_ids = input_ids.to(device)
	        attention_mask = attention_mask.to(device)

	        st.write("🤖 Model response:")
	        # TextStreamer prints tokens to stdout (the server log), not to the
	        # page, so no Streamlit placeholder is needed around it.
	        text_streamer = TextStreamer(tokenizer, skip_prompt=True, skip_special_tokens=False)
	        output = model.generate(
	            input_ids=input_ids,
	            attention_mask=attention_mask,
	            max_new_tokens=250,
	            temperature=0.7,
	            top_p=0.95,
	            do_sample=True,
	            pad_token_id=tokenizer.eos_token_id,
	            use_cache=True,
	            streamer=text_streamer,
	        )

	        # The returned sequence starts with the prompt tokens. Decode only
	        # what was generated after them, and drop template/special tokens so
	        # the user sees the answer rather than raw chat markup.
	        prompt_len = input_ids.shape[-1]
	        decoded = tokenizer.decode(output[0][prompt_len:], skip_special_tokens=True).strip()
	        st.write(f"Decoded output: {decoded}")

	        st.session_state.history.append((prompt, decoded))
	        return decoded

	    except Exception as e:
	        st.error(f"Error during generation: {str(e)}")
	        return None

	# Page heading and a one-line description of the app.
	st.title("🧠 AnthroBot")
	st.markdown("Enter your anthropometric details to receive an AI-generated summary of health metrics.")

	# Two input modes: a single person entered by hand, or many rows from a CSV.
	tab_labels = ["🧍 Manual Input", "📄 CSV Upload"]
	tab1, tab2 = st.tabs(tab_labels)

	with tab1:
	    st.subheader("Manual Entry")

	    # Collect the five measurements that make up the prompt.
	    age = st.number_input("Age", min_value=1, max_value=120, value=30)
	    sex_choices = ["male", "female"]
	    sex = st.selectbox("Sex", options=sex_choices)
	    height = st.number_input(
	        "Height (cm)", min_value=50.0, max_value=250.0, value=170.0
	    )
	    weight = st.number_input(
	        "Weight (kg)", min_value=10.0, max_value=300.0, value=70.0
	    )
	    wc = st.number_input(
	        "Waist Circumference (cm)", min_value=20.0, max_value=200.0, value=80.0
	    )

	    # Only query the model when the user explicitly asks for an estimate.
	    estimate_clicked = st.button("Estimate Metrics")
	    if estimate_clicked:
	        prediction = generate_response(age, sex, height, weight, wc)
	        # A falsy result means generation failed; nothing more is shown here.
	        if prediction:
	            st.success("Prediction:")
	            st.write(prediction)

	# List every (prompt, response) pair stored in this session's history.
	st.subheader("Prediction History")
	for past_prompt, past_response in st.session_state["history"]:
	    st.markdown(f"Input: {past_prompt}")
	    st.markdown(f"Output: {past_response}")

	with tab2:
	    st.subheader("Batch Upload via CSV")

	    # Columns every uploaded file must provide (one prompt is built per row).
	    required_columns = ["Age", "Sex", "Height", "Weight", "WC"]

	    # One-row template the user can download to see the expected layout.
	    sample_csv = pd.DataFrame({
	        "Age": [30],
	        "Sex": ["male"],
	        "Height": [170.0],
	        "Weight": [70.0],
	        "WC": [80.0],
	    })

	    st.download_button("📥 Download Sample CSV", sample_csv.to_csv(index=False), file_name="sample_input.csv")

	    uploaded_file = st.file_uploader("Upload your CSV file", type=["csv"])

	    if uploaded_file:
	        # An empty, malformed, or wrongly-encoded upload must not crash the
	        # page, so report the parse failure instead of letting it propagate.
	        df = None
	        try:
	            df = pd.read_csv(uploaded_file)
	        except (pd.errors.EmptyDataError, pd.errors.ParserError, UnicodeDecodeError) as e:
	            st.error(f"Could not read the uploaded CSV: {str(e)}")

	        if df is not None:
	            if not all(col in df.columns for col in required_columns):
	                st.error("CSV must contain columns: Age, Sex, Height, Weight, WC")
	            else:
	                outputs = []
	                with st.spinner("Generating predictions..."):
	                    for _, row in df.iterrows():
	                        prediction = generate_response(row['Age'], row['Sex'], row['Height'], row['Weight'], row['WC'])
	                        # A failed row still gets an entry so the column
	                        # stays aligned with the input rows.
	                        outputs.append(prediction if prediction else "Error")

	                df["Prediction"] = outputs
	                st.success("Here are your predictions:")
	                st.dataframe(df)

	                csv_output = df.to_csv(index=False).encode("utf-8")
	                st.download_button("📤 Download Predictions", data=csv_output, file_name="predictions.csv")

	# Empty the stored history, then rerun so the page reflects the reset.
	clear_clicked = st.button("Clear History")
	if clear_clicked:
	    st.session_state["history"] = []
	    st.rerun()