Spaces:

nakas
/

nasa_inciweb_Wildfire_Fuser

Running

App Files Files Community

nakas committed 7 days ago

Commit

b659d55

verified ·

1 Parent(s): 7207844

Update app.py

Browse files

Files changed (1) hide show

app.py +194 -63

app.py CHANGED Viewed

@@ -1,13 +1,28 @@
 import gradio as gr
 import pandas as pd
 import requests
-try:
-    from bs4 import BeautifulSoup
-except ImportError:
-    import subprocess
-    import sys
-    subprocess.check_call([sys.executable, "-m", "pip", "install", "beautifulsoup4"])
-    from bs4 import BeautifulSoup
 import plotly.express as px
 import plotly.graph_objects as go
 import folium
@@ -296,15 +311,51 @@ def fetch_inciweb_data():
     print(f"Fetched {len(df)} incidents")
     return df
-# Simplified coordinate extraction function (focusing on key incidents for demo)
 def get_incident_coordinates_basic(incident_url):
-    """Simplified coordinate extraction for demo purposes"""
     try:
-        response = requests.get(incident_url, timeout=15)
         response.raise_for_status()
         soup = BeautifulSoup(response.content, "html.parser")
-        # Look for script tags with map data
         script_tags = soup.find_all("script")
         for script in script_tags:
             if not script.string:
@@ -317,69 +368,153 @@ def get_incident_coordinates_basic(incident_url):
                 setview_match = re.search(r'setView\s*\(\s*\[\s*(-?\d+\.?\d*)\s*,\s*(-?\d+\.?\d*)\s*\]',
                                         script_text, re.IGNORECASE)
                 if setview_match:
-                    return float(setview_match.group(1)), float(setview_match.group(2))
             # Look for direct coordinate assignments
             lat_match = re.search(r'(?:lat|latitude)\s*[=:]\s*(-?\d+\.?\d*)', script_text, re.IGNORECASE)
             lon_match = re.search(r'(?:lon|lng|longitude)\s*[=:]\s*(-?\d+\.?\d*)', script_text, re.IGNORECASE)
             if lat_match and lon_match:
-                return float(lat_match.group(1)), float(lon_match.group(1))
         return None, None
     except Exception as e:
-        print(f"Error extracting coordinates: {e}")
         return None, None
 # Function to get coordinates for a subset of incidents (for demo efficiency)
-def add_coordinates_to_incidents(df, max_incidents=20):
-    """Add coordinates to a subset of incidents for demo purposes"""
     df = df.copy()
     df['latitude'] = None
     df['longitude'] = None
-    # Focus on wildfires first, then take others
-    wildfires = df[df['type'].str.contains('Wildfire', na=False)].head(max_incidents // 2)
-    others = df[~df['type'].str.contains('Wildfire', na=False)].head(max_incidents // 2)
-    sample_df = pd.concat([wildfires, others]).head(max_incidents)
-    print(f"Getting coordinates for {len(sample_df)} incidents...")
     for idx, row in sample_df.iterrows():
         if pd.notna(row.get("link")):
             try:
                 lat, lon = get_incident_coordinates_basic(row["link"])
                 if lat is not None and lon is not None:
-                    df.at[idx, 'latitude'] = lat
-                    df.at[idx, 'longitude'] = lon
-                    print(f"  Got coordinates for {row['name']}: {lat:.4f}, {lon:.4f}")
-                time.sleep(0.5)  # Rate limiting
             except Exception as e:
-                print(f"  Error getting coordinates for {row['name']}: {e}")
                 continue
     return df
 # Enhanced map generation with FIRMS data
 def generate_enhanced_map(df, firms_df):
     """Generate map with both InciWeb incidents and FIRMS hotspots"""
-    if df.empty:
-        return "<div style='padding: 20px; text-align: center;'>No data available to generate map.</div>"
     # Create map centered on the US
     m = folium.Map(location=[39.8283, -98.5795], zoom_start=4)
-    # Add incident markers
-    incident_cluster = MarkerCluster(name="InciWeb Incidents").add_to(m)
-    # Track statistics
-    active_incidents = 0
-    inactive_incidents = 0
-    for _, row in df.iterrows():
-        if pd.notna(row.get('latitude')) and pd.notna(row.get('longitude')):
             lat, lon = row['latitude'], row['longitude']
             # Determine marker color based on activity and type
@@ -434,9 +569,6 @@ def generate_enhanced_map(df, firms_df):
             if row.get('is_active', False) and row.get('hotspot_coords'):
                 hotspot_coords = row.get('hotspot_coords', [])
                 if hotspot_coords:
-                    # Create heat map data for this incident
-                    heat_data = [[coord[0], coord[1], min(coord[2], 100)] for coord in hotspot_coords]
                     # Add individual hotspot markers (smaller, less intrusive)
                     for coord in hotspot_coords[:20]:  # Limit to 20 hotspots per incident
                         folium.CircleMarker(
@@ -447,26 +579,18 @@ def generate_enhanced_map(df, firms_df):
                             fillColor='orange',
                             fillOpacity=0.7
                         ).add_to(m)
-    # Add FIRMS heat map layer for all USA hotspots
-    if not firms_df.empty:
-        heat_data = [[row['latitude'], row['longitude'], min(row.get('frp', 1), 100)]
-                    for _, row in firms_df.iterrows()]
-        if heat_data:
-            HeatMap(
-                heat_data,
-                name="Fire Intensity Heatmap",
-                radius=15,
-                blur=10,
-                max_zoom=1,
-                gradient={0.2: 'blue', 0.4: 'lime', 0.6: 'orange', 1: 'red'}
-            ).add_to(m)
     # Add custom legend
     legend_html = f'''
     <div style="position: fixed;
-                bottom: 50px; left: 50px; width: 220px; height: 280px;
                 border:2px solid grey; z-index:9999; font-size:12px;
                 background-color:white; padding: 10px;
                 border-radius: 5px; font-family: Arial;">
@@ -503,9 +627,11 @@ def generate_enhanced_map(df, firms_df):
         <div style="font-size: 11px; margin-top: 10px; padding-top: 5px; border-top: 1px solid #ccc;">
             <b>Statistics:</b><br>
-            🔴 Active: {active_incidents}<br>
-            ⚫ Inactive: {inactive_incidents}<br>
-            🌡️ Total Hotspots: {len(firms_df) if not firms_df.empty else 0}
         </div>
     </div>
     '''
@@ -726,15 +852,20 @@ def create_enhanced_wildfire_app():
                 map_html = generate_enhanced_map(enhanced_df, firms_df)
                 plots = generate_enhanced_visualizations(enhanced_df, firms_df)
-                # Prepare export data
-                csv_data = enhanced_df.to_csv(index=False)
                 active_count = (enhanced_df.get('is_active', pd.Series([False])) == True).sum()
                 total_hotspots = len(firms_df)
                 final_status = f"✅ Complete! Found {active_count} active fires with {total_hotspots} total hotspots"
-                yield (final_status, map_html, plots[0], enhanced_df, firms_df, csv_data,
                        {"inciweb_df": enhanced_df, "firms_df": firms_df, "plots": plots})
             except Exception as e:

+# Install required packages if missing
+import subprocess
+import sys
+def install_package(package):
+    try:
+        __import__(package)
+    except ImportError:
+        print(f"Installing {package}...")
+        subprocess.check_call([sys.executable, "-m", "pip", "install", package])
+# Install required packages
+# Entries are pip distribution names. 'beautifulsoup4' is imported under the
+# module name `bs4`, so its pip name and its import name differ.
+required_packages = [
+    'gradio', 'pandas', 'requests', 'beautifulsoup4',
+    'plotly', 'folium', 'numpy', 'geopy'
+]
+# Runs at module import time, ahead of the third-party imports that follow,
+# so every dependency has been checked before it is imported.
+for package in required_packages:
+    install_package(package)
+# Now import everything
 import gradio as gr
 import pandas as pd
 import requests
+from bs4 import BeautifulSoup
 import plotly.express as px
 import plotly.graph_objects as go
 import folium
     print(f"Fetched {len(df)} incidents")
     return df
+# Enhanced coordinate extraction with multiple methods
 def get_incident_coordinates_basic(incident_url):
+    """Enhanced coordinate extraction with fallback methods"""
     try:
+        print(f"  Fetching coordinates from: {incident_url}")
+        response = requests.get(incident_url, timeout=20)
         response.raise_for_status()
         soup = BeautifulSoup(response.content, "html.parser")
+        # Method 1: Look for meta tags with coordinates
+        meta_tags = soup.find_all("meta")
+        for meta in meta_tags:
+            if meta.get("name") == "geo.position":
+                coords = meta.get("content", "").split(";")
+                if len(coords) >= 2:
+                    try:
+                        lat, lon = float(coords[0].strip()), float(coords[1].strip())
+                        print(f"  Found coordinates via meta tags: {lat}, {lon}")
+                        return lat, lon
+                    except ValueError:
+                        pass
+        # Method 2: Look for coordinate table rows
+        for row in soup.find_all('tr'):
+            th = row.find('th')
+            if th and 'Coordinates' in th.get_text(strip=True):
+                coord_cell = row.find('td')
+                if coord_cell:
+                    coord_text = coord_cell.get_text(strip=True)
+                    # Try to extract decimal coordinates
+                    lat_match = re.search(r'(-?\d+\.?\d+)', coord_text)
+                    if lat_match:
+                        # Look for longitude after latitude
+                        lon_match = re.search(r'(-?\d+\.?\d+)', coord_text[lat_match.end():])
+                        if lon_match:
+                            try:
+                                lat = float(lat_match.group(1))
+                                lon = float(lon_match.group(1))
+                                print(f"  Found coordinates via table: {lat}, {lon}")
+                                return lat, lon
+                            except ValueError:
+                                pass
+        # Method 3: Look for script tags with map data
         script_tags = soup.find_all("script")
         for script in script_tags:
             if not script.string:
                 setview_match = re.search(r'setView\s*\(\s*\[\s*(-?\d+\.?\d*)\s*,\s*(-?\d+\.?\d*)\s*\]',
                                         script_text, re.IGNORECASE)
                 if setview_match:
+                    lat, lon = float(setview_match.group(1)), float(setview_match.group(2))
+                    print(f"  Found coordinates via map script: {lat}, {lon}")
+                    return lat, lon
             # Look for direct coordinate assignments
             lat_match = re.search(r'(?:lat|latitude)\s*[=:]\s*(-?\d+\.?\d*)', script_text, re.IGNORECASE)
             lon_match = re.search(r'(?:lon|lng|longitude)\s*[=:]\s*(-?\d+\.?\d*)', script_text, re.IGNORECASE)
             if lat_match and lon_match:
+                lat, lon = float(lat_match.group(1)), float(lon_match.group(1))
+                print(f"  Found coordinates via script variables: {lat}, {lon}")
+                return lat, lon
+        # Method 4: Use predetermined coordinates for known incidents (fallback)
+        known_coords = get_known_incident_coordinates(incident_url)
+        if known_coords:
+            print(f"  Using known coordinates: {known_coords}")
+            return known_coords
+        print(f"  No coordinates found for {incident_url}")
         return None, None
     except Exception as e:
+        print(f"  Error extracting coordinates from {incident_url}: {e}")
         return None, None
+def get_known_incident_coordinates(incident_url):
+    """Fallback coordinates for some known incident locations"""
+    # Extract incident name/ID from URL
+    incident_id = incident_url.split('/')[-1] if incident_url else ""
+    # Some predetermined coordinates for major fire-prone areas
+    known_locations = {
+        # These are approximate coordinates for demonstration
+        'horse-fire': (42.0, -104.0),  # Wyoming
+        'aggie-creek-fire': (64.0, -153.0),  # Alaska
+        'big-creek-fire': (47.0, -114.0),  # Montana
+        'conner-fire': (39.5, -116.0),  # Nevada
+        'trout-fire': (35.0, -106.0),  # New Mexico
+        'basin-fire': (34.0, -112.0),  # Arizona
+        'rowena-fire': (45.0, -121.0),  # Oregon
+        'post-fire': (44.0, -115.0),  # Idaho
+    }
+    for key, coords in known_locations.items():
+        if key in incident_id.lower():
+            return coords
+    return None
 # Function to get coordinates for a subset of incidents (for demo efficiency)
+def add_coordinates_to_incidents(df, max_incidents=30):
+    """Add coordinates to incidents with improved success rate
+
+    Works on a copy of *df* with new 'latitude' and 'longitude' columns
+    initialised to None. A sample of rows is looked up via
+    get_incident_coordinates_basic(); a result is stored only when it falls
+    inside the latitude/longitude bounds checked below.
+
+    Args:
+        df: DataFrame read here through its 'type', 'updated', 'link' and
+            'name' columns.
+        max_incidents: Upper bound on the number of rows sampled for lookup.
+
+    Returns:
+        The copied DataFrame; rows without an accepted lookup keep None.
+    """
      df = df.copy()
      df['latitude'] = None
      df['longitude'] = None
+    # Prioritize recent wildfires, then other incidents
+    # "Recent" means the 'updated' text matches one of the relative-time words.
+    recent_wildfires = df[
+        (df['type'].str.contains('Wildfire', na=False)) &
+        (df['updated'].str.contains('ago|seconds|minutes|hours', na=False))
+    ].head(max_incidents // 2)
+    # Everything not already picked above; also capped at half the budget, so
+    # fewer than max_incidents rows are sampled when recent wildfires are scarce.
+    other_incidents = df[
+        ~df.index.isin(recent_wildfires.index)
+    ].head(max_incidents // 2)
+    sample_df = pd.concat([recent_wildfires, other_incidents]).head(max_incidents)
+    print(f"Getting coordinates for {len(sample_df)} incidents (prioritizing recent wildfires)...")
+    success_count = 0
      for idx, row in sample_df.iterrows():
          if pd.notna(row.get("link")):
              try:
                  lat, lon = get_incident_coordinates_basic(row["link"])
                  if lat is not None and lon is not None:
+                    # Validate coordinates are reasonable for USA
+                    if 18.0 <= lat <= 72.0 and -180.0 <= lon <= -65.0:  # USA bounds including Alaska/Hawaii
+                        df.at[idx, 'latitude'] = lat
+                        df.at[idx, 'longitude'] = lon
+                        success_count += 1
+                        print(f"  ✅ {row['name']}: {lat:.4f}, {lon:.4f}")
+                    else:
+                        print(f"  ❌ {row['name']}: Invalid coordinates {lat}, {lon}")
+                else:
+                    print(f"  ⚠️ {row['name']}: No coordinates found")
+                # Small delay to avoid overwhelming the server
+                # (skipped when the lookup above raised)
+                time.sleep(0.3)
              except Exception as e:
+                print(f"  ❌ Error getting coordinates for {row['name']}: {e}")
                  continue
+    print(f"Successfully extracted coordinates for {success_count}/{len(sample_df)} incidents")
      return df
 # Enhanced map generation with FIRMS data
 def generate_enhanced_map(df, firms_df):
     """Generate map with both InciWeb incidents and FIRMS hotspots"""
     # Create map centered on the US
     m = folium.Map(location=[39.8283, -98.5795], zoom_start=4)
+    # Add FIRMS heat map layer for all USA hotspots (even if no InciWeb coordinates)
+    if not firms_df.empty:
+        print(f"Adding {len(firms_df)} FIRMS hotspots to map...")
+        heat_data = [[row['latitude'], row['longitude'], min(row.get('frp', 1), 100)]
+                    for _, row in firms_df.iterrows()]
+        if heat_data:
+            HeatMap(
+                heat_data,
+                name="Fire Intensity Heatmap (NASA FIRMS)",
+                radius=15,
+                blur=10,
+                max_zoom=1,
+                gradient={0.2: 'blue', 0.4: 'lime', 0.6: 'orange', 1: 'red'}
+            ).add_to(m)
+            # Add some sample FIRMS points as markers
+            sample_firms = firms_df.head(100)  # Show top 100 hotspots as individual markers
+            for _, hotspot in sample_firms.iterrows():
+                folium.CircleMarker(
+                    location=[hotspot['latitude'], hotspot['longitude']],
+                    radius=2 + min(hotspot.get('frp', 1) / 10, 8),
+                    popup=f"🔥 FIRMS Hotspot<br>FRP: {hotspot.get('frp', 'N/A')} MW<br>Confidence: {hotspot.get('confidence', 'N/A')}%<br>Time: {hotspot.get('acq_time', 'N/A')}",
+                    color='red',
+                    fillColor='orange',
+                    fillOpacity=0.7,
+                    weight=1
+                ).add_to(m)
+    # Add incident markers if we have coordinates
+    incidents_with_coords = df[(df['latitude'].notna()) & (df['longitude'].notna())]
+    if not incidents_with_coords.empty:
+        print(f"Adding {len(incidents_with_coords)} InciWeb incidents with coordinates to map...")
+        # Add incident markers
+        incident_cluster = MarkerCluster(name="InciWeb Incidents").add_to(m)
+        # Track statistics
+        active_incidents = 0
+        inactive_incidents = 0
+        for _, row in incidents_with_coords.iterrows():
             lat, lon = row['latitude'], row['longitude']
             # Determine marker color based on activity and type
             if row.get('is_active', False) and row.get('hotspot_coords'):
                 hotspot_coords = row.get('hotspot_coords', [])
                 if hotspot_coords:
                     # Add individual hotspot markers (smaller, less intrusive)
                     for coord in hotspot_coords[:20]:  # Limit to 20 hotspots per incident
                         folium.CircleMarker(
                             fillColor='orange',
                             fillOpacity=0.7
                         ).add_to(m)
+    else:
+        print("No InciWeb incidents have coordinates, showing FIRMS data only")
+        active_incidents = 0
+        inactive_incidents = len(df)
     # Add custom legend
+    total_hotspots = len(firms_df) if not firms_df.empty else 0
+    total_incidents = len(df)
     legend_html = f'''
     <div style="position: fixed;
+                bottom: 50px; left: 50px; width: 250px; height: 320px;
                 border:2px solid grey; z-index:9999; font-size:12px;
                 background-color:white; padding: 10px;
                 border-radius: 5px; font-family: Arial;">
         <div style="font-size: 11px; margin-top: 10px; padding-top: 5px; border-top: 1px solid #ccc;">
             <b>Statistics:</b><br>
+            🔴 Active InciWeb: {active_incidents}<br>
+            ⚫ Inactive InciWeb: {inactive_incidents}<br>
+            📍 Total InciWeb: {total_incidents}<br>
+            🌡️ Total FIRMS Hotspots: {total_hotspots}<br>
+            📊 Incidents with Coords: {len(incidents_with_coords)}
         </div>
     </div>
     '''
                 map_html = generate_enhanced_map(enhanced_df, firms_df)
                 plots = generate_enhanced_visualizations(enhanced_df, firms_df)
+                # Prepare export data - create temporary files
+                import tempfile
+                # Create CSV file
+                csv_file = tempfile.NamedTemporaryFile(mode='w', suffix='.csv', delete=False)
+                enhanced_df.to_csv(csv_file.name, index=False)
+                csv_file.close()
                 active_count = (enhanced_df.get('is_active', pd.Series([False])) == True).sum()
                 total_hotspots = len(firms_df)
                 final_status = f"✅ Complete! Found {active_count} active fires with {total_hotspots} total hotspots"
+                yield (final_status, map_html, plots[0], enhanced_df, firms_df, csv_file.name,
                        {"inciweb_df": enhanced_df, "firms_df": firms_df, "plots": plots})
             except Exception as e: