cattlemodel / app.py
yougandar's picture
Create app.py
427dba7 verified
import streamlit as st
import pandas as pd
import random
import joblib
from sklearn.ensemble import RandomForestClassifier
from sklearn.preprocessing import StandardScaler
from sklearn.model_selection import train_test_split
from sklearn.metrics import classification_report
import matplotlib.pyplot as plt
import seaborn as sns
import numpy as np
import os
# Load cattle data
DATA_FILE = 'cattle_data.csv'
def load_data():
# Check if the dataset exists
if os.path.exists(DATA_FILE):
return pd.read_csv(DATA_FILE)
else:
return pd.DataFrame(columns=['TAG ID', 'BREED', 'AGE', 'SURGERY', 'REPRODUCTION CYCLES', 'OTHER'])
# Function to generate random sensor data for a specific cow breed
def generate_sensor_data(cow_breed):
cow_data = {
'Holstein Friesian': {'body_temp': (38.0, 39.0), 'rumination': (600, 800), 'steps': (8000, 12000), 'behavior_score': (6, 8)},
'Girolando': {'body_temp': (38.0, 39.0), 'rumination': (650, 750), 'steps': (7000, 10000), 'behavior_score': (7, 9)},
'Jersey': {'body_temp': (38.0, 39.0), 'rumination': (650, 750), 'steps': (7500, 10500), 'behavior_score': (6, 8)},
'Sahiwal': {'body_temp': (38.0, 39.0), 'rumination': (550, 700), 'steps': (6500, 9000), 'behavior_score': (7, 9)},
'Kankrej': {'body_temp': (38.0, 39.0), 'rumination': (600, 750), 'steps': (7000, 10000), 'behavior_score': (7, 9)}
}
data = cow_data.get(cow_breed)
if not data:
return None
sensor_data = {
'Body Temperature (°C)': round(random.uniform(data['body_temp'][0], data['body_temp'][1]), 2),
'Rumination (min/day)': random.randint(data['rumination'][0], data['rumination'][1]),
'Step Count (steps/day)': random.randint(data['steps'][0], data['steps'][1]),
'Behavior Score (1-10)': random.randint(data['behavior_score'][0], data['behavior_score'][1])
}
return sensor_data
# Load the data and preprocess
df = load_data()
# Feature Engineering - Create features like daily trends or differences if needed
df['milk_yield_change'] = df['AGE'].diff().fillna(0) # Just an example to create a derived feature
# Merge sensor data with cattle profile
cow_breeds = ['Holstein Friesian', 'Girolando', 'Jersey', 'Sahiwal', 'Kankrej']
sensor_data_list = []
for breed in cow_breeds:
sensor_data = generate_sensor_data(breed)
if sensor_data:
sensor_data['TAG ID'] = random.randint(1, 100) # Random TAG ID for simulation
sensor_data['BREED'] = breed
sensor_data_list.append(sensor_data)
sensor_df = pd.DataFrame(sensor_data_list)
# Merge with the original cattle profile dataset
df = pd.merge(df, sensor_df, on='TAG ID', how='left')
# Model Training (Disease Prediction)
X = df[['Body Temperature (°C)', 'Rumination (min/day)', 'Step Count (steps/day)', 'Behavior Score (1-10)', 'AGE']]
y = df['OTHER'].apply(lambda x: 1 if x == 'Healthy' else 0) # Convert health status to binary (0 = not healthy, 1 = healthy)
# Data Preprocessing
scaler = StandardScaler()
X_scaled = scaler.fit_transform(X)
# Train Test Split
X_train, X_test, y_train, y_test = train_test_split(X_scaled, y, test_size=0.3, random_state=42)
# Train a Random Forest Classifier
model = RandomForestClassifier(n_estimators=100, random_state=42)
model.fit(X_train, y_train)
# Save the trained model
joblib.dump(model, 'disease_prediction_model.pkl')
joblib.dump(scaler, 'scaler.pkl')
# Evaluate the model
y_pred = model.predict(X_test)
st.write("Model Evaluation Results")
st.text(classification_report(y_test, y_pred))
# Streamlit App
st.title('Cattle Profile & Disease Prediction Dashboard')
# Register New Cow form
st.header("➕ Register New Cow")
tag_id = st.number_input("TAG ID", min_value=1, step=1)
breed = st.selectbox("Breed", cow_breeds)
age = st.number_input("Age (in years)", min_value=0, step=1)
surgery = st.text_input("Surgery")
reproduction_cycles = st.number_input("Reproduction Cycles", min_value=0, step=1)
other = st.text_input("Other Health Details")
submit = st.button("Register Cow")
if submit:
new_cow = pd.DataFrame([{
'TAG ID': tag_id,
'BREED': breed,
'AGE': age,
'SURGERY': surgery,
'REPRODUCTION CYCLES': reproduction_cycles,
'OTHER': other
}])
df = pd.concat([df, new_cow], ignore_index=True)
st.write("Cow registered successfully!")
# Select RFID dropdown to view details
st.header("🔢 Select RFID Tag ID")
selected_rfid = st.selectbox("Select RFID Tag ID", df['TAG ID'].unique())
if selected_rfid:
cow_info = df[df['TAG ID'] == selected_rfid].iloc[0]
st.write(f"**TAG ID:** {cow_info['TAG ID']}")
st.write(f"**BREED:** {cow_info['BREED']}")
st.write(f"**AGE:** {cow_info['AGE']} years")
st.write(f"**SURGERY:** {cow_info['SURGERY']}")
st.write(f"**REPRODUCTION CYCLES:** {cow_info['REPRODUCTION CYCLES']}")
st.write(f"**OTHER HEALTH DETAILS:** {cow_info['OTHER']}")
# Predict disease status based on the selected cow's data
selected_data = scaler.transform([[
cow_info['Body Temperature (°C)'],
cow_info['Rumination (min/day)'],
cow_info['Step Count (steps/day)'],
cow_info['Behavior Score (1-10)'],
cow_info['AGE']
]])
disease_prediction = model.predict(selected_data)
disease_status = "Healthy" if disease_prediction[0] == 1 else "Not Healthy"
st.write(f"Predicted Health Status: {disease_status}")
# Display cow milk yield trends
st.header("🐄 Cow Milk Yield Trends")
milk_data = {
'Tag ID': df['TAG ID'],
'Date': pd.date_range(start='2025-04-01', periods=len(df), freq='D'),
'Milk Yield (L)': np.random.uniform(10, 22, len(df)),
}
milk_df = pd.DataFrame(milk_data)
# Plot trends
st.subheader('Milk Yield Trend for Each Cow')
plt.figure(figsize=(10, 6))
sns.lineplot(data=milk_df, x='Date', y='Milk Yield (L)', hue='Tag ID', marker='o')
plt.title('Milk Yield Trend (Day-wise for Each Cow)')
plt.xlabel('Date')
plt.ylabel('Milk Yield (L)')
plt.xticks(rotation=45)
st.pyplot()
# Save updated data back to CSV
df.to_csv(DATA_FILE, index=False)