File size: 9,341 Bytes
8ba57d6
 
8023c2d
 
8ba57d6
8023c2d
 
8ba57d6
8023c2d
8ba57d6
 
8023c2d
 
 
 
 
 
fc818a1
8023c2d
 
 
 
728b9e0
8023c2d
 
 
728b9e0
8023c2d
 
 
 
afb3711
8023c2d
 
afb3711
8023c2d
 
 
11eee3c
ba1686c
 
11eee3c
ba1686c
11eee3c
 
20e589d
11eee3c
 
 
 
 
 
 
 
 
 
 
8023c2d
 
11eee3c
8023c2d
 
 
 
 
 
20e589d
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
11eee3c
ba1686c
11eee3c
afb3711
11eee3c
8023c2d
afb3711
11eee3c
 
 
 
 
 
 
 
afb3711
11eee3c
 
 
 
20e589d
11eee3c
 
 
 
 
 
 
 
 
8023c2d
 
11eee3c
8023c2d
11eee3c
8023c2d
11eee3c
 
 
 
 
8023c2d
 
11eee3c
8023c2d
 
11eee3c
 
 
8023c2d
 
 
8ba57d6
8023c2d
8ba57d6
8023c2d
89e980a
8023c2d
 
 
d453c25
20e589d
 
 
8023c2d
 
20e589d
 
d453c25
6bf06e3
20e589d
 
8023c2d
 
20e589d
 
d453c25
6bf06e3
8023c2d
 
20e589d
8023c2d
 
 
 
 
 
 
 
 
 
 
 
 
 
20e589d
8023c2d
 
 
 
 
 
 
8ba57d6
8023c2d
8ba57d6
8023c2d
 
 
 
20e589d
 
8023c2d
 
8ba57d6
8023c2d
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
8ba57d6
20e589d
8023c2d
 
20e589d
 
 
8023c2d
 
20e589d
8023c2d
20e589d
 
 
8023c2d
 
d453c25
8023c2d
 
 
 
 
20e589d
 
8023c2d
 
 
 
20e589d
 
8023c2d
20e589d
8023c2d
 
 
 
 
 
 
 
d453c25
 
8023c2d
8ba57d6
8023c2d
 
20e589d
 
8023c2d
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
import streamlit as st
import pandas as pd
import pydeck as pdk
import math

# --- PAGE CONFIGURATION ---
st.set_page_config(layout="wide", page_title="Frontier AI Emissions Map")

# --- CUSTOM CSS FOR METRICS & STYLE ---
st.markdown("""
<style>
    .metric-card {
        background-color: #1E1E1E;
        border: 1px solid #333;
        border-radius: 8px;
        padding: 15px;
        margin-bottom: 10px;
    }
    .metric-value {
        font-size: 24px;
        font-weight: bold;
        color: #FFFFFF;
    }
    .metric-label {
        font-size: 14px;
        color: #AAAAAA;
    }
    /* Tooltip styling logic happens in PyDeck, but general text style */
    body {
        color: #E0E0E0;
        background-color: #0E1117;
    }
</style>
""", unsafe_allow_html=True)

# --- 1. DATA LOADING & CLEANING ---
@st.cache_data
def load_data():
    try:
        # Load data, skipping the first empty row (header=1 means Row 2 is the header)
        df = pd.read_csv("Frontier AI DC Emissions - Frontier Timeline.csv", header=1)
        
        # Sanitize Headers (removes hidden spaces)
        df.columns = df.columns.str.strip()
        
        # Validation
        required_cols = ['Power (MW)', 'Carbon Intensity', 'Annual Million tCO2']
        missing = [c for c in required_cols if c not in df.columns]
        if missing:
            st.error(f"❌ Missing columns: {missing}. Found columns: {df.columns.tolist()}")
            st.stop()

    except FileNotFoundError:
        st.error("❌ File not found. Please ensure 'Frontier AI DC Emissions - Frontier Timeline.csv' is uploaded.")
        st.stop()

    # --- Data Cleaning ---
    def clean_numeric(val):
        if isinstance(val, str):
            val = val.replace(',', '').replace('"', '').strip()
        return pd.to_numeric(val, errors='coerce')

    df['Power (MW)'] = df['Power (MW)'].apply(clean_numeric)
    df['Carbon Intensity'] = df['Carbon Intensity'].apply(clean_numeric)
    df['Annual Million tCO2'] = df['Annual Million tCO2'].apply(clean_numeric)

    # --- CLEAN OWNER NAMES ---
    # Remove "#confident", "#likely", etc.
    if 'Owner' in df.columns:
        df['Owner'] = df['Owner'].astype(str).str.split('#').str[0].str.strip()

    # --- SIMPLIFY GRID STATUS ---
    # Create a clean category for the filter (Grid vs Off-Grid vs Hybrid)
    def simplify_status(status):
        s = str(status).lower()
        if 'off-grid' in s or 'gas' in s: return "Off-Grid / Fossil"
        elif 'hybrid' in s or 'nuclear' in s: return "Hybrid / Nuclear"
        elif 'grid' in s: return "Grid Connected"
        else: return "Unknown"
    
    df['Simple_Connection'] = df['Grid Status'].apply(simplify_status)

    # --- MATH CHECK ---
    # Formula: MW * 8760 hours * (Intensity kg/MWh / 1000 to get tonnes) / 1,000,000 to get Million Tonnes
    # We calculate this to double-check the CSV's reported numbers
    df['Calculated_Mt'] = (df['Power (MW)'] * 8760 * df['Carbon Intensity']) / 1e9
    
    # Use the Reported number, but normalize it (Handle the 13,093 vs 13.1 issue)
    df['Emissions_Mt'] = df['Annual Million tCO2'].apply(lambda x: x / 1000 if x > 100 else x)
    
    # --- Geocoding (Manual Overrides for missing Lat/Long) ---
    overrides = {
        'Fermi': [35.344, -101.373],       # Amarillo, TX
        'Crane': [40.154, -76.725],        # Three Mile Island
        'CleanArc': [38.005, -77.478],     # Caroline County, VA
        'Vantage': [38.381, -77.495],      # Fredericksburg, VA
        'Stargate': [42.167, -83.850]      # Michigan
    }
    
    for key, coords in overrides.items():
        mask = df['Project'].astype(str).str.contains(key, case=False, na=False)
        df.loc[mask, ['Latitude', 'Longitude']] = coords

    # Parse DMS coordinates
    def dms_to_dd(val):
        if isinstance(val, str) and '°' in val:
            try:
                parts = val.replace('°', ' ').replace("'", ' ').replace('"', ' ').split()
                dd = float(parts[0]) + float(parts[1])/60 + (float(parts[2]) if len(parts)>2 else 0)/3600
                if 'S' in val or 'W' in val: dd *= -1
                return dd
            except: return None
        return val

    for col in ['Latitude', 'Longitude']:
        df[col] = df[col].apply(dms_to_dd)
        df[col] = pd.to_numeric(df[col], errors='coerce')

    df = df.dropna(subset=['Latitude', 'Longitude'])

    # --- Enrichment for Tooltip ---
    # Cars: 1 MtCO2 ≈ 217,000 cars (4.6t/car/yr)
    df['Cars_Equivalent_Millions'] = (df['Emissions_Mt'] * 1_000_000 / 4.6 / 1_000_000).round(2)
    # Coal Plants: 1 Coal Plant ≈ 4.0 MtCO2
    df['Coal_Plants_Equivalent'] = (df['Emissions_Mt'] / 4.0).round(1)

    # Visual Attributes
    def get_color(status):
        s = str(status).lower()
        if 'off-grid' in s or 'gas' in s: return [255, 65, 54, 200]  # Red
        elif 'hybrid' in s or 'nuclear' in s: return [255, 133, 27, 200] # Orange
        else: return [0, 116, 217, 200]  # Blue

    df['color'] = df['Grid Status'].apply(get_color)
    df['radius'] = df['Emissions_Mt'].apply(lambda x: math.sqrt(x) * 15000) 

    return df

df = load_data()

# --- SIDEBAR CONTROLS ---
st.sidebar.header("🌍 Frontier AI Emissions")
st.sidebar.markdown("Filter the map to analyze the carbon footprint of planned AI infrastructure.")

# Filters: Connection Type (Simplified)
# We sort them to ensure consistent order
connection_options = sorted(df['Simple_Connection'].unique())
grid_filter = st.sidebar.multiselect(
    "Connection Type",
    options=connection_options,
    default=connection_options
)

# Filters: Owner (Cleaned)
owner_options = sorted(df['Owner'].unique())
owner_filter = st.sidebar.multiselect(
    "Owner",
    options=owner_options,
    default=owner_options
)

# Apply filters
filtered_df = df[
    (df['Simple_Connection'].isin(grid_filter)) & 
    (df['Owner'].isin(owner_filter))
]

# --- SCORECARD METRICS ---
total_power = filtered_df['Power (MW)'].sum() / 1000 # GW
total_emissions = filtered_df['Emissions_Mt'].sum()
total_cars = filtered_df['Cars_Equivalent_Millions'].sum()
avg_intensity = filtered_df['Carbon Intensity'].mean()

st.sidebar.divider()
st.sidebar.markdown("### 📊 Aggregate Impact")

col1, col2 = st.sidebar.columns(2)
col1.metric("Total Power", f"{total_power:.1f} GW", help="Total capacity of visible projects")
col2.metric("Annual Emissions", f"{total_emissions:.1f} Mt", help="Million Tonnes CO2e/year")

st.sidebar.markdown(f"""
<div class="metric-card">
    <div class="metric-label">🚗 Equivalent Traffic Added</div>
    <div class="metric-value">{total_cars:.1f} Million Cars</div>
</div>
""", unsafe_allow_html=True)

st.sidebar.markdown(f"**Avg Carbon Intensity:** {avg_intensity:.0f} kg/MWh")

# --- MAIN MAP ---
st.title("The Carbon Footprint of Frontier AI")
st.markdown(
    "This map visualizes the annual emissions of major planned AI data centers. "
    "**Bubble size** represents CO₂e emissions. **Color** indicates grid status "
    "(<span style='color:#FF4136'><b>Red = Off-Grid/Fossil</b></span>, <span style='color:#0074D9'><b>Blue = Grid Connected</b></span>).",
    unsafe_allow_html=True
)

# PyDeck Layer
layer = pdk.Layer(
    "ScatterplotLayer",
    filtered_df,
    get_position="[Longitude, Latitude]",
    get_radius="radius",
    get_fill_color="color",
    pickable=True,
    opacity=0.8,
    stroked=True,
    filled=True,
    radius_min_pixels=5,
    radius_max_pixels=100,
    line_width_min_pixels=1,
    get_line_color=[0, 0, 0],
)

# Tooltip (Updated for Data Center Name & Subscript)
tooltip = {
    "html": """
        <div style="font-family: sans-serif; padding: 8px; color: white; max-width: 250px;">
            <h4 style="margin:0; padding-bottom:5px;">{Data Center Name}</h4>
            <hr style="border-top: 1px solid #555; margin: 5px 0;">
            <b>Owner:</b> {Owner}<br/>
            <b>Power:</b> {Power (MW)} MW<br/>
            <b>Status:</b> {Simple_Connection}<br/>
            <br/>
            <b style="font-size: 1.1em; color: #ffcccb;">Emissions: {Emissions_Mt} MtCO<sub>2</sub>e</b><br/>
            <i style="font-size: 0.8em; color: #ccc;">(Intensity: {Carbon Intensity} kg/MWh)</i>
            <hr style="border-top: 1px dashed #555; margin: 5px 0;">
            <b>🚗 Equal to:</b> {Cars_Equivalent_Millions} Million Cars<br/>
            <b>🏭 Equal to:</b> {Coal_Plants_Equivalent} Coal Power Plants
        </div>
    """,
    "style": {
        "backgroundColor": "#1E1E1E",
        "border": "1px solid #333",
        "borderRadius": "8px",
        "color": "white",
        "zIndex": "1000"
    }
}

# Render Map
# FIX: Removed 'mapbox://' style to prevent black screen. 
# Using map_style=None uses the default adaptable map.
st.pydeck_chart(pdk.Deck(
    map_style=None, 
    initial_view_state=pdk.ViewState(
        latitude=39.8,
        longitude=-98.6,
        zoom=3.5,
        pitch=0,
    ),
    layers=[layer],
    tooltip=tooltip
))

# --- FOOTER / SOURCE ---
st.markdown("---")
st.caption(
    "**Methodology:** Emissions calculated based on publicly stated power capacity (MW) and regional/source-specific carbon intensity. "
    "Car equivalents assume 4.6 metric tonnes CO₂e per passenger vehicle per year (EPA). "
    "Coal plant equivalent assumes ~4.0 MtCO₂e/year for a typical plant."
)