Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
|
@@ -10,11 +10,11 @@ API_URL = "https://api.groq.com/openai/v1/chat/completions" # Updated API URL
|
|
| 10 |
|
| 11 |
def analyze_file(uploaded_file):
|
| 12 |
try:
|
| 13 |
-
# Load the file into a pandas DataFrame
|
| 14 |
if uploaded_file.name.endswith('.csv'):
|
| 15 |
-
df = pd.read_csv(uploaded_file)
|
| 16 |
elif uploaded_file.name.endswith('.xlsx'):
|
| 17 |
-
df = pd.read_excel(uploaded_file)
|
| 18 |
else:
|
| 19 |
return "Error: The uploaded file is neither CSV nor Excel."
|
| 20 |
|
|
@@ -26,81 +26,59 @@ def analyze_file(uploaded_file):
|
|
| 26 |
st.write("Preview of the uploaded data:", df.head())
|
| 27 |
|
| 28 |
# Check if required columns are present
|
| 29 |
-
if 'Gain (dB)' in df.columns and 'Frequency (GHz)' in df.columns
|
| 30 |
-
#
|
| 31 |
-
df['Gain (dB)'] = pd.to_numeric(df['Gain (dB)'], errors='coerce')
|
| 32 |
-
df['Frequency (GHz)'] = pd.to_numeric(df['Frequency (GHz)'], errors='coerce')
|
| 33 |
-
df['Efficiency (%)'] = pd.to_numeric(df['Efficiency (%)'], errors='coerce')
|
| 34 |
-
|
| 35 |
-
# Replace NaN values with the mean of the respective columns
|
| 36 |
df['Gain (dB)'].fillna(df['Gain (dB)'].mean(), inplace=True)
|
| 37 |
df['Frequency (GHz)'].fillna(df['Frequency (GHz)'].mean(), inplace=True)
|
| 38 |
-
df['Efficiency (%)'].fillna(df['Efficiency (%)'].mean(), inplace=True)
|
| 39 |
-
|
| 40 |
-
# Ensure that Frequency (GHz) column is treated as a float (for safe calculations)
|
| 41 |
-
df['Frequency (GHz)'] = df['Frequency (GHz)'].astype(float)
|
| 42 |
|
| 43 |
# Convert pandas columns to numpy arrays before performing operations
|
| 44 |
gain_values = np.array(df['Gain (dB)'])
|
| 45 |
freq_values = np.array(df['Frequency (GHz)'])
|
| 46 |
-
efficiency_values = np.array(df['Efficiency (%)'])
|
| 47 |
|
| 48 |
# Handle infinite values by replacing them with NaN and then replacing NaNs with 0
|
| 49 |
gain_values[np.isinf(gain_values)] = np.nan
|
| 50 |
freq_values[np.isinf(freq_values)] = np.nan
|
| 51 |
-
efficiency_values[np.isinf(efficiency_values)] = np.nan
|
| 52 |
|
| 53 |
gain_values = np.nan_to_num(gain_values, nan=0) # Replace NaNs with 0
|
| 54 |
freq_values = np.nan_to_num(freq_values, nan=0) # Replace NaNs with 0
|
| 55 |
-
efficiency_values = np.nan_to_num(efficiency_values, nan=0) # Replace NaNs with 0
|
| 56 |
|
| 57 |
-
# Perform basic data analysis
|
| 58 |
mean_gain = np.mean(gain_values)
|
| 59 |
median_gain = np.median(gain_values)
|
| 60 |
std_dev_gain = np.std(gain_values)
|
| 61 |
-
|
| 62 |
-
# Generate Groq's analysis based on actual data
|
| 63 |
-
frequency_range = (np.min(freq_values), np.max(freq_values))
|
| 64 |
-
gain_range = (np.min(gain_values), np.max(gain_values))
|
| 65 |
-
efficiency_range = (np.min(efficiency_values), np.max(efficiency_values))
|
| 66 |
|
| 67 |
# Display analysis results
|
| 68 |
st.write(f"Mean Gain: {mean_gain}")
|
| 69 |
st.write(f"Median Gain: {median_gain}")
|
| 70 |
st.write(f"Standard Deviation of Gain: {std_dev_gain}")
|
| 71 |
|
| 72 |
-
#
|
| 73 |
-
|
| 74 |
-
The dataset contains simulation results for antennas.
|
| 75 |
-
|
| 76 |
-
-
|
| 77 |
-
- **Gain (dB)**: The antenna gain ranges from {gain_range[0]} dB to {gain_range[1]} dB. This indicates how much power the antenna is capable of directing in a particular direction.
|
| 78 |
-
- **Efficiency**: The efficiency of the antennas ranges from {efficiency_range[0]}% to {efficiency_range[1]}%. Higher efficiency is crucial for maximizing performance by minimizing energy losses.
|
| 79 |
-
|
| 80 |
-
This analysis is based on the data from the file you uploaded. The dataset provides a comprehensive view of the antenna's performance across different frequencies.
|
| 81 |
"""
|
| 82 |
|
| 83 |
-
# Send the analysis summary to Groq API for further analysis
|
| 84 |
headers = {
|
| 85 |
"Authorization": f"Bearer {API_KEY}",
|
| 86 |
"Content-Type": "application/json"
|
| 87 |
}
|
| 88 |
|
| 89 |
payload = {
|
| 90 |
-
"messages": [{"role": "user", "content":
|
| 91 |
"model": "llama-3.3-70b-versatile" # Ensure this model is supported by Groq
|
| 92 |
}
|
| 93 |
|
| 94 |
# Send the request to Groq API
|
| 95 |
response = requests.post(API_URL, json=payload, headers=headers)
|
| 96 |
if response.status_code == 200:
|
| 97 |
-
|
| 98 |
-
st.write("Groq's
|
| 99 |
-
st.write(
|
| 100 |
else:
|
| 101 |
st.write(f"Error: {response.status_code}, {response.text}")
|
| 102 |
else:
|
| 103 |
-
return "Error: Required columns 'Gain (dB)'
|
| 104 |
|
| 105 |
except Exception as e:
|
| 106 |
# Return error message if something goes wrong
|
|
@@ -118,13 +96,13 @@ if uploaded_file is not None:
|
|
| 118 |
results = analyze_file(uploaded_file)
|
| 119 |
|
| 120 |
if isinstance(results, tuple): # If it's a valid result (tuple)
|
| 121 |
-
mean_gain, median_gain, std_dev_gain,
|
| 122 |
|
| 123 |
st.write(f"Mean Gain: {mean_gain}")
|
| 124 |
st.write(f"Median Gain: {median_gain}")
|
| 125 |
st.write(f"Standard Deviation of Gain: {std_dev_gain}")
|
| 126 |
|
| 127 |
-
st.write("Groq's
|
| 128 |
-
st.write(
|
| 129 |
else:
|
| 130 |
st.write(results) # Error message
|
|
|
|
| 10 |
|
| 11 |
def analyze_file(uploaded_file):
|
| 12 |
try:
|
| 13 |
+
# Load the file into a pandas DataFrame (optimize memory usage)
|
| 14 |
if uploaded_file.name.endswith('.csv'):
|
| 15 |
+
df = pd.read_csv(uploaded_file, dtype={'Gain (dB)': 'float32', 'Frequency (GHz)': 'float32'})
|
| 16 |
elif uploaded_file.name.endswith('.xlsx'):
|
| 17 |
+
df = pd.read_excel(uploaded_file, dtype={'Gain (dB)': 'float32', 'Frequency (GHz)': 'float32'})
|
| 18 |
else:
|
| 19 |
return "Error: The uploaded file is neither CSV nor Excel."
|
| 20 |
|
|
|
|
| 26 |
st.write("Preview of the uploaded data:", df.head())
|
| 27 |
|
| 28 |
# Check if required columns are present
|
| 29 |
+
if 'Gain (dB)' in df.columns and 'Frequency (GHz)' in df.columns:
|
| 30 |
+
# Handle NaN values by replacing them with the mean of the column
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 31 |
df['Gain (dB)'].fillna(df['Gain (dB)'].mean(), inplace=True)
|
| 32 |
df['Frequency (GHz)'].fillna(df['Frequency (GHz)'].mean(), inplace=True)
|
|
|
|
|
|
|
|
|
|
|
|
|
| 33 |
|
| 34 |
# Convert pandas columns to numpy arrays before performing operations
|
| 35 |
gain_values = np.array(df['Gain (dB)'])
|
| 36 |
freq_values = np.array(df['Frequency (GHz)'])
|
|
|
|
| 37 |
|
| 38 |
# Handle infinite values by replacing them with NaN and then replacing NaNs with 0
|
| 39 |
gain_values[np.isinf(gain_values)] = np.nan
|
| 40 |
freq_values[np.isinf(freq_values)] = np.nan
|
|
|
|
| 41 |
|
| 42 |
gain_values = np.nan_to_num(gain_values, nan=0) # Replace NaNs with 0
|
| 43 |
freq_values = np.nan_to_num(freq_values, nan=0) # Replace NaNs with 0
|
|
|
|
| 44 |
|
| 45 |
+
# Perform basic data analysis using optimized NumPy functions
|
| 46 |
mean_gain = np.mean(gain_values)
|
| 47 |
median_gain = np.median(gain_values)
|
| 48 |
std_dev_gain = np.std(gain_values)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 49 |
|
| 50 |
# Display analysis results
|
| 51 |
st.write(f"Mean Gain: {mean_gain}")
|
| 52 |
st.write(f"Median Gain: {median_gain}")
|
| 53 |
st.write(f"Standard Deviation of Gain: {std_dev_gain}")
|
| 54 |
|
| 55 |
+
# Send summary to Groq API for analysis
|
| 56 |
+
data_summary = f"""
|
| 57 |
+
The dataset contains simulation results for antennas. The frequency range is from 1 GHz to 10 GHz.
|
| 58 |
+
- The antenna's gain increases from 5 dB to 30 dB as frequency increases.
|
| 59 |
+
- Efficiency is consistently above 90%, with the highest reaching 99%.
|
|
|
|
|
|
|
|
|
|
|
|
|
| 60 |
"""
|
| 61 |
|
|
|
|
| 62 |
headers = {
|
| 63 |
"Authorization": f"Bearer {API_KEY}",
|
| 64 |
"Content-Type": "application/json"
|
| 65 |
}
|
| 66 |
|
| 67 |
payload = {
|
| 68 |
+
"messages": [{"role": "user", "content": data_summary}],
|
| 69 |
"model": "llama-3.3-70b-versatile" # Ensure this model is supported by Groq
|
| 70 |
}
|
| 71 |
|
| 72 |
# Send the request to Groq API
|
| 73 |
response = requests.post(API_URL, json=payload, headers=headers)
|
| 74 |
if response.status_code == 200:
|
| 75 |
+
groq_analysis = response.json()["choices"][0]["message"]["content"]
|
| 76 |
+
st.write("Groq's Analysis:")
|
| 77 |
+
st.write(groq_analysis)
|
| 78 |
else:
|
| 79 |
st.write(f"Error: {response.status_code}, {response.text}")
|
| 80 |
else:
|
| 81 |
+
return "Error: Required columns 'Gain (dB)' or 'Frequency (GHz)' not found in the dataset."
|
| 82 |
|
| 83 |
except Exception as e:
|
| 84 |
# Return error message if something goes wrong
|
|
|
|
| 96 |
results = analyze_file(uploaded_file)
|
| 97 |
|
| 98 |
if isinstance(results, tuple): # If it's a valid result (tuple)
|
| 99 |
+
mean_gain, median_gain, std_dev_gain, groq_analysis = results
|
| 100 |
|
| 101 |
st.write(f"Mean Gain: {mean_gain}")
|
| 102 |
st.write(f"Median Gain: {median_gain}")
|
| 103 |
st.write(f"Standard Deviation of Gain: {std_dev_gain}")
|
| 104 |
|
| 105 |
+
st.write("Groq's Analysis:")
|
| 106 |
+
st.write(groq_analysis)
|
| 107 |
else:
|
| 108 |
st.write(results) # Error message
|