YashMK89 commited on
Commit
7a7dd74
·
verified ·
1 Parent(s): 8b8d12a

update app.py

Browse files
Files changed (1) hide show
  1. app.py +474 -320
app.py CHANGED
@@ -53,24 +53,32 @@ with open(os.path.expanduser("~/.config/earthengine/credentials"), "w") as f:
53
 
54
  ee.Initialize(project='ee-yashsacisro24')
55
 
56
- # Load Sentinel dataset options from JSON file
57
  with open("sentinel_datasets.json") as f:
58
  data = json.load(f)
59
 
60
- # Display the title and dataset selection
61
  st.title("Sentinel Dataset")
62
 
63
- # Select dataset category and subcategory (case-insensitive selection)
64
  main_selection = st.selectbox("Select Sentinel Dataset Category", list(data.keys()))
65
 
 
66
  if main_selection:
67
  sub_options = data[main_selection]["sub_options"]
68
  sub_selection = st.selectbox("Select Specific Dataset ID", list(sub_options.keys()))
69
 
 
 
 
 
 
 
 
 
70
  # Earth Engine Index Calculator Section
71
  st.header("Earth Engine Index Calculator")
72
 
73
- # Choose Index or Custom Formula (case-insensitive)
74
  index_choice = st.selectbox("Select an Index or Enter Custom Formula", ['NDVI', 'NDWI', 'Average NO₂', 'Custom Formula'])
75
 
76
  # Initialize custom_formula variable
@@ -84,10 +92,31 @@ elif index_choice.lower() == 'ndwi':
84
  elif index_choice.lower() == 'average no₂':
85
  st.write("Formula for Average NO₂: Average NO₂ = Mean(NO2 band)")
86
  elif index_choice.lower() == 'custom formula':
87
- custom_formula = st.text_input("Enter Custom Formula (e.g., '(B5 - B4) / (B5 + B4)')")
88
- st.write(f"Custom Formula: {custom_formula}") # Display the custom formula after the user inputs it
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
89
 
90
- # Reducer selection
91
  reducer_choice = st.selectbox(
92
  "Select Reducer",
93
  ['mean', 'sum', 'median', 'min', 'max', 'count'],
@@ -123,6 +152,93 @@ shape_type = st.selectbox("Do you want to process 'Point' or 'Polygon' data?", [
123
  # Ask user to upload a file based on shape type (case-insensitive)
124
  file_upload = st.file_uploader(f"Upload your {shape_type} data (CSV, GeoJSON, KML)", type=["csv", "geojson", "kml"])
125
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
126
  # Date Input for Start and End Dates
127
  start_date = st.date_input("Start Date", value=pd.to_datetime('2020-01-01'))
128
  end_date = st.date_input("End Date", value=pd.to_datetime('2020-12-31'))
@@ -131,6 +247,9 @@ end_date = st.date_input("End Date", value=pd.to_datetime('2020-12-31'))
131
  start_date_str = start_date.strftime('%Y-%m-%d')
132
  end_date_str = end_date.strftime('%Y-%m-%d')
133
 
 
 
 
134
  # Initialize session state for storing results if not already done
135
  if 'results' not in st.session_state:
136
  st.session_state.results = []
@@ -143,7 +262,7 @@ if 'map_data' not in st.session_state:
143
  def parameters_changed():
144
  return (
145
  st.session_state.last_params.get('main_selection') != main_selection or
146
- st.session_state.last_params.get('sub_selection') != sub_selection or
147
  st.session_state.last_params.get('index_choice') != index_choice or
148
  st.session_state.last_params.get('start_date_str') != start_date_str or
149
  st.session_state.last_params.get('end_date_str') != end_date_str or
@@ -156,7 +275,7 @@ if parameters_changed():
156
  st.session_state.results = [] # Clear the previous results
157
  st.session_state.last_params = {
158
  'main_selection': main_selection,
159
- 'sub_selection': sub_selection,
160
  'index_choice': index_choice,
161
  'start_date_str': start_date_str,
162
  'end_date_str': end_date_str,
@@ -164,339 +283,374 @@ if parameters_changed():
164
  'file_upload': file_upload
165
  }
166
 
167
- # Function to get the corresponding reducer based on user input
168
- def get_reducer(reducer_name):
169
- """
170
- Map user-friendly reducer names to Earth Engine reducer objects.
171
-
172
- Args:
173
- reducer_name (str): The name of the reducer (e.g., 'mean', 'sum', 'median').
174
-
175
- Returns:
176
- ee.Reducer: The corresponding Earth Engine reducer.
177
- """
178
- reducers = {
179
- 'mean': ee.Reducer.mean(),
180
- 'sum': ee.Reducer.sum(),
181
- 'median': ee.Reducer.median(),
182
- 'min': ee.Reducer.min(),
183
- 'max': ee.Reducer.max(),
184
- 'count': ee.Reducer.count(),
185
- }
186
-
187
- # Default to 'mean' if the reducer_name is not recognized
188
- return reducers.get(reducer_name.lower(), ee.Reducer.mean())
189
-
190
- # Function to calculate NDVI
191
- def calculate_ndvi(image, geometry):
192
  ndvi = image.normalizedDifference(['B8', 'B4']).rename('NDVI')
193
-
194
- # Perform reduction on the region with the selected reducer
195
- result = ndvi.reduceRegion(
196
- reducer=get_reducer(reducer_choice),
197
- geometry=geometry,
198
- scale=30
199
- )
200
-
201
- # Output debugging information
202
- result_value = result.get('NDVI')
203
- try:
204
- calculated_value = result_value.getInfo()
205
- st.write(f"NDVI calculation using {reducer_choice}: {calculated_value}")
206
- except Exception as e:
207
- st.error(f"Error retrieving NDVI result: {e}")
208
-
209
- return result_value
210
-
211
 
212
  # Function to calculate NDWI
213
- def calculate_ndwi(image, geometry):
214
  ndwi = image.normalizedDifference(['B3', 'B8']).rename('NDWI')
215
- result = ndwi.reduceRegion(
216
- reducer=get_reducer(reducer_choice),
217
- geometry=geometry,
218
- scale=30
219
- )
220
-
221
- # Output debugging information
222
- result_value = result.get('NDWI')
223
- try:
224
- calculated_value = result_value.getInfo()
225
- st.write(f"NDVI calculation using {reducer_choice}: {calculated_value}")
226
- except Exception as e:
227
- st.error(f"Error retrieving NDVI result: {e}")
228
-
229
- return result_value
230
-
231
- # Function to calculate Average NO₂ for Sentinel-5P
232
- def calculate_avg_no2_sentinel5p(image, geometry):
233
- no2 = image.select('NO2').reduceRegion(
234
- reducer=get_reducer(reducer_choice),
235
- geometry=geometry,
236
- scale=1000
237
- )
238
-
239
- # Output debugging information
240
- result_value = result.get('NDVI')
241
- try:
242
- calculated_value = result_value.getInfo()
243
- st.write(f"NDVI calculation using {reducer_choice}: {calculated_value}")
244
- except Exception as e:
245
- st.error(f"Error retrieving NDVI result: {e}")
246
-
247
- return result_value
248
 
249
- # Function to calculate Custom Formula
250
- def calculate_custom_formula(image, geometry, formula, scale=30):
251
- """
252
- Calculate a custom formula on an image and return the result for a given geometry,
253
- using a user-specified reducer.
254
- """
255
- # Dynamically generate the dictionary of band references from the image
256
- band_names = image.bandNames().getInfo()
257
- band_dict = {band: image.select(band) for band in band_names}
258
 
259
- # Use the formula with the bands in the image
260
- result_image = image.expression(formula, band_dict).rename('CustomResult')
261
-
262
- # Reduce the region to get the result based on the specified reducer
263
- result = result_image.reduceRegion(
264
- reducer=get_reducer(reducer_choice),
265
- geometry=geometry,
266
- scale=scale
267
- )
268
 
269
- # Output debugging information
270
- result_value = result.get('CustomResult')
271
- try:
272
- calculated_value = result_value.getInfo()
273
- st.write(f"NDVI calculation using {reducer_choice}: {calculated_value}")
274
- except Exception as e:
275
- st.error(f"Error retrieving NDVI result: {e}")
276
 
277
- return result_value
278
-
279
- # Function to get the most recent image from the collection
280
- def get_most_recent_image(image_collection):
281
- image = image_collection.sort('system:time_start', False).first()
282
- return image
283
-
284
-
285
- # Function to process the custom formula
286
- def process_custom_formula(image, geometry, formula):
287
- return calculate_custom_formula(image, geometry, formula)
288
 
289
- locations_df = None # Initialize locations_df to None
290
- polygons_df = None # Ensure polygons_df is initialized at the beginning
 
 
 
291
 
292
- # Process each point (with additional checks for file validity)
293
- # Check the shape type and assign polygons_df only for Polygon data
294
- if file_upload:
295
- # locations_df = None # Initialize locations_df to None
296
- # polygons_df = None # Ensure polygons_df is initialized at the beginning
297
-
298
- file_extension = os.path.splitext(file_upload.name)[1].lower()
299
 
300
- # Read file based on shape type
301
- if shape_type == 'Point':
302
- if file_extension == '.csv':
303
- locations_df = read_csv(file_upload)
304
- elif file_extension == '.geojson':
305
- locations_df = read_geojson(file_upload)
306
- elif file_extension == '.kml':
307
- locations_df = read_kml(file_upload)
308
- else:
309
- st.error("Unsupported file type. Please upload a CSV, GeoJSON, or KML file for points.")
310
- elif shape_type == 'Polygon':
311
- if file_extension == '.geojson':
312
- polygons_df = read_geojson(file_upload)
313
- elif file_extension == '.kml':
314
- polygons_df = read_kml(file_upload)
315
- else:
316
- st.error("Unsupported file type. Please upload a GeoJSON or KML file for polygons.")
317
 
 
 
 
 
318
 
319
- if locations_df is not None and not locations_df.empty:
320
- # Ensure the necessary columns exist in the dataframe
321
- if 'latitude' not in locations_df.columns or 'longitude' not in locations_df.columns:
322
- st.error("Uploaded file is missing required 'latitude' or 'longitude' columns.")
323
- else:
324
- # Display a preview of the points data
325
- st.write("Preview of the uploaded points data:")
326
- st.dataframe(locations_df.head())
327
-
328
- # Create a LeafMap object to display the points
329
- m = leafmap.Map(center=[locations_df['latitude'].mean(), locations_df['longitude'].mean()], zoom=10)
330
-
331
- # Add points to the map using a loop
332
- for _, row in locations_df.iterrows():
333
- latitude = row['latitude']
334
- longitude = row['longitude']
335
-
336
- # Check if latitude or longitude are NaN and skip if they are
337
- if pd.isna(latitude) or pd.isna(longitude):
338
- continue # Skip this row and move to the next one
339
-
340
- m.add_marker(location=[latitude, longitude], popup=row.get('name', 'No Name'))
341
-
342
- # Display map
343
- st.write("Map of Uploaded Points:")
344
- m.to_streamlit()
345
-
346
- # Store the map in session_state
347
- st.session_state.map_data = m
348
-
349
- # Process each point for index calculation
350
- for idx, row in locations_df.iterrows():
351
- latitude = row['latitude']
352
- longitude = row['longitude']
353
- location_name = row.get('name', f"Location_{idx}")
354
-
355
- # Skip processing if latitude or longitude is NaN
356
- if pd.isna(latitude) or pd.isna(longitude):
357
- continue # Skip this row and move to the next one
358
-
359
- # Define the region of interest (ROI)
360
- roi = ee.Geometry.Point([longitude, latitude])
361
-
362
- # Load Sentinel-2 image collection
363
- collection = ee.ImageCollection(sub_options[sub_selection]) \
364
- .filterDate(ee.Date(start_date_str), ee.Date(end_date_str)) \
365
- .filterBounds(roi)
366
-
367
- image = get_most_recent_image(collection)
368
- if not image:
369
- st.warning(f"No images found for {location_name}.")
370
- else:
371
- st.write(f"Found images for {location_name}.")
372
- # Perform the calculation based on user selection
373
- # Perform the calculation based on user selection
374
- result = None
375
- if index_choice == 'NDVI':
376
- result = calculate_ndvi(image, roi)
377
- elif index_choice == 'NDWI':
378
- result = calculate_ndwi(image, roi)
379
- elif index_choice == 'Average NO₂':
380
- if 'NO2' in image.bandNames().getInfo():
381
- result = calculate_avg_no2_sentinel5p(image, roi)
382
- else:
383
- st.warning(f"No NO2 band found for {location_name}. Please use Sentinel-5P for NO₂ data.")
384
- elif index_choice.lower() == 'custom formula' and custom_formula:
385
- result = process_custom_formula(image, roi, custom_formula)
386
-
387
- # Validate result before using getInfo
388
- if result is not None:
389
- calculated_value = None # Initialize the calculated_value as None
390
-
391
- # Check if the result is a dictionary
392
- if isinstance(result, dict):
393
- # Extract the value using the appropriate key (adjust the key name as needed)
394
- calculated_value = result.get('CustomResult', None) # Replace 'CustomResult' if using NDVI, NDWI, etc.
395
- else:
396
- try:
397
- # If it's an Earth Engine object, get the value using getInfo
398
- calculated_value = result.getInfo()
399
- except Exception as e:
400
- st.error(f"Error getting result info: {e}")
401
-
402
- # If a valid calculated_value is found, append the result to session_state
403
- if calculated_value is not None:
404
- st.session_state.results.append({
405
- 'Location Name': location_name,
406
- 'Latitude': latitude,
407
- 'Longitude': longitude,
408
- 'Calculated Value': calculated_value
409
- })
410
- else:
411
- st.warning(f"No value calculated for {location_name}.")
412
- else:
413
- st.warning(f"No value calculated for {location_name}.")
414
-
415
 
416
- # Check if polygons_df is populated for polygons
417
- if polygons_df is not None:
418
- st.write("Preview of the uploaded polygons data:")
419
- st.dataframe(polygons_df.head())
420
 
421
- m = leafmap.Map(center=[polygons_df.geometry.centroid.y.mean(), polygons_df.geometry.centroid.x.mean()], zoom=10)
 
 
 
 
 
422
 
423
- for _, row in polygons_df.iterrows():
424
- polygon = row['geometry']
425
- if polygon.is_valid:
426
- gdf = gpd.GeoDataFrame([row], geometry=[polygon], crs=polygons_df.crs)
427
- m.add_gdf(gdf=gdf, layer_name=row.get('name', 'Unnamed Polygon'))
428
 
429
- st.write("Map of Uploaded Polygons:")
430
- m.to_streamlit()
431
- st.session_state.map_data = m
 
432
 
433
- for idx, row in polygons_df.iterrows():
434
- polygon = row['geometry']
435
- location_name = row.get('name', f"Polygon_{idx}")
 
 
 
436
 
437
- try:
438
- roi = convert_to_ee_geometry(polygon)
439
- except ValueError as e:
440
- st.error(str(e))
441
- continue
442
 
443
- collection = ee.ImageCollection(sub_options[sub_selection]) \
444
- .filterDate(ee.Date(start_date_str), ee.Date(end_date_str)) \
445
- .filterBounds(roi)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
446
 
447
- image = get_most_recent_image(collection)
 
448
 
449
- if not image:
450
- st.warning(f"No images found for {location_name}.")
451
- else:
452
- st.write(f"Found an image for {location_name}.")
453
- result = None
454
- if index_choice.lower() == 'ndvi':
455
- result = calculate_ndvi(image, roi)
456
- elif index_choice.lower() == 'ndwi':
457
- result = calculate_ndwi(image, roi)
458
- elif index_choice.lower() == 'average no₂':
459
- if 'NO2' in image.bandNames().getInfo():
460
- result = calculate_avg_no2_sentinel5p(image, roi)
461
- else:
462
- st.warning(f"No NO2 band found for {location_name}. Please use Sentinel-5P for NO₂ data.")
463
- elif index_choice.lower() == 'custom formula' and custom_formula:
464
- result = process_custom_formula(image, roi, custom_formula)
465
-
466
- if result is not None:
467
- # Initialize the calculated_value as None
468
- calculated_value = None
469
 
470
- # Check if the result is a dictionary (e.g., custom formula result)
471
- if isinstance(result, dict) and 'CustomResult' in result:
472
- calculated_value = result['CustomResult'] # Extract the numeric value from the dictionary
473
- # If the result is a numeric value (e.g., NDVI, NDWI, or NO2)
474
- elif isinstance(result, (int, float)):
475
- calculated_value = result
476
-
477
- # If a valid calculated_value is found, append the result to session_state
478
- if calculated_value is not None:
479
- st.session_state.results.append({
480
- 'Location Name': location_name,
481
- 'Calculated Value': calculated_value
482
- })
483
-
484
- # After processing, show the results
485
- if st.session_state.results:
486
- result_df = pd.DataFrame(st.session_state.results)
487
-
488
- if shape_type.lower() == 'point':
489
- st.write("Processed Results Table (Points):")
490
- st.dataframe(result_df[['Location Name', 'Latitude', 'Longitude', 'Calculated Value']])
491
- else:
492
- st.write("Processed Results Table (Polygons):")
493
- st.dataframe(result_df[['Location Name', 'Calculated Value']])
494
 
495
- filename = f"{main_selection}_{sub_selection}_{start_date.strftime('%Y/%m/%d')}_{end_date.strftime('%Y/%m/%d')}_{shape_type}.csv"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
496
 
497
- st.download_button(
498
- label="Download results as CSV",
499
- data=result_df.to_csv(index=False).encode('utf-8'),
500
- file_name=filename,
501
- mime='text/csv'
502
- )
 
53
 
54
  ee.Initialize(project='ee-yashsacisro24')
55
 
56
+ # Load the Sentinel dataset options from JSON file
57
  with open("sentinel_datasets.json") as f:
58
  data = json.load(f)
59
 
60
+ # Display the title for the Streamlit app
61
  st.title("Sentinel Dataset")
62
 
63
+ # Select dataset category (main selection)
64
  main_selection = st.selectbox("Select Sentinel Dataset Category", list(data.keys()))
65
 
66
+ # If a category is selected, display the sub-options (specific datasets)
67
  if main_selection:
68
  sub_options = data[main_selection]["sub_options"]
69
  sub_selection = st.selectbox("Select Specific Dataset ID", list(sub_options.keys()))
70
 
71
+ # Display the selected dataset ID based on user input
72
+ if sub_selection:
73
+ st.write(f"You selected: {main_selection} -> {sub_selection}")
74
+ st.write(f"Dataset ID: {sub_options[sub_selection]}")
75
+
76
+ # Fetch the correct dataset ID from the sub-selection
77
+ dataset_id = sub_options[sub_selection]
78
+
79
  # Earth Engine Index Calculator Section
80
  st.header("Earth Engine Index Calculator")
81
 
 
82
  index_choice = st.selectbox("Select an Index or Enter Custom Formula", ['NDVI', 'NDWI', 'Average NO₂', 'Custom Formula'])
83
 
84
  # Initialize custom_formula variable
 
92
  elif index_choice.lower() == 'average no₂':
93
  st.write("Formula for Average NO₂: Average NO₂ = Mean(NO2 band)")
94
  elif index_choice.lower() == 'custom formula':
95
+ custom_formula = st.text_input("Enter Custom Formula (e.g., B5,B4)")
96
+ # Check if custom formula is empty and show warning
97
+ if not custom_formula:
98
+ st.warning("Please enter a custom formula before proceeding.")
99
+ else:
100
+ st.write(f"Custom Formula: (band1 - band2) / (band1 + band2)") # Display the custom formula after the user inputs it
101
+
102
+ # Function to get the corresponding reducer based on user input
103
+ def get_reducer(reducer_name):
104
+ """
105
+ Map user-friendly reducer names to Earth Engine reducer objects.
106
+ """
107
+ reducers = {
108
+ 'mean': ee.Reducer.mean(),
109
+ 'sum': ee.Reducer.sum(),
110
+ 'median': ee.Reducer.median(),
111
+ 'min': ee.Reducer.min(),
112
+ 'max': ee.Reducer.max(),
113
+ 'count': ee.Reducer.count(),
114
+ }
115
+
116
+ # Default to 'mean' if the reducer_name is not recognized
117
+ return reducers.get(reducer_name.lower(), ee.Reducer.mean())
118
 
119
+ # Streamlit selectbox for reducer choice
120
  reducer_choice = st.selectbox(
121
  "Select Reducer",
122
  ['mean', 'sum', 'median', 'min', 'max', 'count'],
 
152
  # Ask user to upload a file based on shape type (case-insensitive)
153
  file_upload = st.file_uploader(f"Upload your {shape_type} data (CSV, GeoJSON, KML)", type=["csv", "geojson", "kml"])
154
 
155
+ if file_upload is not None:
156
+ # Read the user-uploaded file
157
+ if shape_type.lower() == "point":
158
+ # Handle different file types for Point data
159
+ if file_upload.name.endswith('.csv'):
160
+ locations_df = pd.read_csv(file_upload)
161
+ elif file_upload.name.endswith('.geojson'):
162
+ locations_df = gpd.read_file(file_upload)
163
+ elif file_upload.name.endswith('.kml'):
164
+ locations_df = gpd.read_file(file_upload)
165
+ else:
166
+ st.error("Unsupported file format. Please upload CSV, GeoJSON, or KML.")
167
+ locations_df = pd.DataFrame()
168
+
169
+ # Processing the point data
170
+ with st.spinner('Processing data...'):
171
+ if locations_df is not None and not locations_df.empty:
172
+ # Ensure the necessary columns exist in the dataframe
173
+ if 'latitude' not in locations_df.columns or 'longitude' not in locations_df.columns:
174
+ st.error("Uploaded file is missing required 'latitude' or 'longitude' columns.")
175
+ else:
176
+ # Display a preview of the points data
177
+ st.write("Preview of the uploaded points data:")
178
+ st.dataframe(locations_df.head())
179
+
180
+ # Create a LeafMap object to display the points
181
+ m = leafmap.Map(center=[locations_df['latitude'].mean(), locations_df['longitude'].mean()], zoom=10)
182
+
183
+ # Add points to the map using a loop
184
+ for _, row in locations_df.iterrows():
185
+ latitude = row['latitude']
186
+ longitude = row['longitude']
187
+
188
+ # Check if latitude or longitude are NaN and skip if they are
189
+ if pd.isna(latitude) or pd.isna(longitude):
190
+ continue # Skip this row and move to the next one
191
+
192
+ m.add_marker(location=[latitude, longitude], popup=row.get('name', 'No Name'))
193
+
194
+ # Display map
195
+ st.write("Map of Uploaded Points:")
196
+ m.to_streamlit()
197
+
198
+ # Store the map in session_state
199
+ st.session_state.map_data = m
200
+
201
+ elif shape_type.lower() == "polygon":
202
+ # Handle different file types for Polygon data
203
+ if file_upload.name.endswith('.csv'):
204
+ locations_df = pd.read_csv(file_upload)
205
+ elif file_upload.name.endswith('.geojson'):
206
+ locations_df = gpd.read_file(file_upload)
207
+ elif file_upload.name.endswith('.kml'):
208
+ locations_df = gpd.read_file(file_upload)
209
+ else:
210
+ st.error("Unsupported file format. Please upload CSV, GeoJSON, or KML.")
211
+ locations_df = pd.DataFrame()
212
+
213
+ # Processing the polygon data
214
+ with st.spinner('Processing data...'):
215
+ if locations_df is not None and not locations_df.empty:
216
+ # Ensure the 'geometry' column exists in the dataframe
217
+ if 'geometry' not in locations_df.columns:
218
+ st.error("Uploaded file is missing required 'geometry' column.")
219
+ else:
220
+ # Display a preview of the polygons data
221
+ st.write("Preview of the uploaded polygons data:")
222
+ st.dataframe(locations_df.head())
223
+
224
+ # Create a LeafMap object to display the polygons
225
+ m = leafmap.Map(center=[locations_df.geometry.centroid.y.mean(), locations_df.geometry.centroid.x.mean()], zoom=10)
226
+
227
+ # Add polygons to the map using a loop
228
+ for _, row in locations_df.iterrows():
229
+ polygon = row['geometry']
230
+ if polygon.is_valid:
231
+ gdf = gpd.GeoDataFrame([row], geometry=[polygon], crs=locations_df.crs)
232
+ m.add_gdf(gdf=gdf, layer_name=row.get('name', 'Unnamed Polygon'))
233
+
234
+ # Display map
235
+ st.write("Map of Uploaded Polygons:")
236
+ m.to_streamlit()
237
+
238
+ # Store the map in session_state
239
+ st.session_state.map_data = m
240
+
241
+
242
  # Date Input for Start and End Dates
243
  start_date = st.date_input("Start Date", value=pd.to_datetime('2020-01-01'))
244
  end_date = st.date_input("End Date", value=pd.to_datetime('2020-12-31'))
 
247
  start_date_str = start_date.strftime('%Y-%m-%d')
248
  end_date_str = end_date.strftime('%Y-%m-%d')
249
 
250
+ # Aggregation period selection
251
+ aggregation_period = st.selectbox("Select Aggregation Period", ["Daily", "Weekly", "Monthly", "Yearly"], index=0)
252
+
253
  # Initialize session state for storing results if not already done
254
  if 'results' not in st.session_state:
255
  st.session_state.results = []
 
262
  def parameters_changed():
263
  return (
264
  st.session_state.last_params.get('main_selection') != main_selection or
265
+ st.session_state.last_params.get('dataset_id') != dataset_id or
266
  st.session_state.last_params.get('index_choice') != index_choice or
267
  st.session_state.last_params.get('start_date_str') != start_date_str or
268
  st.session_state.last_params.get('end_date_str') != end_date_str or
 
275
  st.session_state.results = [] # Clear the previous results
276
  st.session_state.last_params = {
277
  'main_selection': main_selection,
278
+ 'dataset_id': dataset_id,
279
  'index_choice': index_choice,
280
  'start_date_str': start_date_str,
281
  'end_date_str': end_date_str,
 
283
  'file_upload': file_upload
284
  }
285
 
286
+ # Function to calculate NDVI with the selected reducer
287
+ def calculate_ndvi(image, geometry, reducer_choice):
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
288
  ndvi = image.normalizedDifference(['B8', 'B4']).rename('NDVI')
289
+ return ndvi
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
290
 
291
  # Function to calculate NDWI
292
+ def calculate_ndwi(image, geometry, reducer_choice):
293
  ndwi = image.normalizedDifference(['B3', 'B8']).rename('NDWI')
294
+ return ndwi
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
295
 
296
+ def calculate_custom_formula(image, geometry, custom_formula, reducer_choice, scale=30):
 
 
 
 
 
 
 
 
297
 
298
+ # Calculate NDWI using the user-specified bands
299
+ band1 = custom_formula[:custom_formula.find(",")]
300
+ band2 = custom_formula[custom_formula.find(",")+1:]
301
+ custom_formula = image.normalizedDifference([band1, band2]).rename('custom formula')
302
+ return custom_formula
 
 
 
 
303
 
304
+ # Modify aggregation functions to return the correct time period and aggregated results
305
+ def aggregate_data_daily(collection):
306
+ # Extract day from the image date (using the exact date)
307
+ collection = collection.map(lambda image: image.set('day', ee.Date(image.get('system:time_start')).format('YYYY-MM-dd')))
 
 
 
308
 
309
+ # Group images by day (distinct days)
310
+ grouped_by_day = collection.aggregate_array('day').distinct()
 
 
 
 
 
 
 
 
 
311
 
312
+ def calculate_daily_mean(day):
313
+ # Filter the collection by the specific day
314
+ daily_collection = collection.filter(ee.Filter.eq('day', day))
315
+ daily_mean = daily_collection.mean() # Calculate mean for the day
316
+ return daily_mean.set('day', day)
317
 
318
+ # Calculate the daily mean for each day
319
+ daily_images = ee.List(grouped_by_day.map(calculate_daily_mean))
320
+
321
+ return ee.ImageCollection(daily_images)
 
 
 
322
 
323
+ def aggregate_data_weekly(collection):
324
+ # Extract week and year from the image date
325
+ collection = collection.map(lambda image: image.set('week', ee.Date(image.get('system:time_start')).format('YYYY-ww')))
326
+
327
+ # Group images by week
328
+ grouped_by_week = collection.aggregate_array('week').distinct()
 
 
 
 
 
 
 
 
 
 
 
329
 
330
+ def calculate_weekly_mean(week):
331
+ weekly_collection = collection.filter(ee.Filter.eq('week', week))
332
+ weekly_mean = weekly_collection.mean()
333
+ return weekly_mean.set('week', week)
334
 
335
+ # Calculate the weekly mean for each week
336
+ weekly_images = ee.List(grouped_by_week.map(calculate_weekly_mean))
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
337
 
338
+ return ee.ImageCollection(weekly_images)
 
 
 
339
 
340
+ def aggregate_data_monthly(collection):
341
+ # Extract month and year from the image date
342
+ collection = collection.map(lambda image: image.set('month', ee.Date(image.get('system:time_start')).format('YYYY-MM')))
343
+
344
+ # Group images by month
345
+ grouped_by_month = collection.aggregate_array('month').distinct()
346
 
347
+ def calculate_monthly_mean(month):
348
+ monthly_collection = collection.filter(ee.Filter.eq('month', month))
349
+ monthly_mean = monthly_collection.mean()
350
+ return monthly_mean.set('month', month)
 
351
 
352
+ # Calculate the monthly mean for each month
353
+ monthly_images = ee.List(grouped_by_month.map(calculate_monthly_mean))
354
+
355
+ return ee.ImageCollection(monthly_images)
356
 
357
+ def aggregate_data_yearly(collection):
358
+ # Extract year from the image date
359
+ collection = collection.map(lambda image: image.set('year', ee.Date(image.get('system:time_start')).format('YYYY')))
360
+
361
+ # Group images by year
362
+ grouped_by_year = collection.aggregate_array('year').distinct()
363
 
364
+ def calculate_yearly_mean(year):
365
+ yearly_collection = collection.filter(ee.Filter.eq('year', year))
366
+ yearly_mean = yearly_collection.mean()
367
+ return yearly_mean.set('year', year)
 
368
 
369
+ # Calculate the yearly mean for each year
370
+ yearly_images = ee.List(grouped_by_year.map(calculate_yearly_mean))
371
+
372
+ return ee.ImageCollection(yearly_images)
373
+
374
+ # Function to calculate index based on the selected choice
375
+ def calculate_index_for_period(image, roi, index_choice, reducer_choice, custom_formula):
376
+ if index_choice.lower() == 'ndvi':
377
+ return calculate_ndvi(image, roi, reducer_choice)
378
+ elif index_choice.lower() == 'ndwi':
379
+ return calculate_ndwi(image, roi, reducer_choice)
380
+ elif index_choice.lower() == 'average no₂':
381
+ mean_no2 = image.select('NO2').mean().rename('Average NO₂')
382
+ return mean_no2
383
+ elif index_choice.lower() == 'custom formula':
384
+ # Pass the custom formula here, not the index_choice
385
+ return calculate_custom_formula(image, roi, custom_formula, reducer_choice)
386
+ else:
387
+ st.write("Please Select any one option...."+ index_choice.lower())
388
 
389
def process_aggregation(locations_df, start_date_str, end_date_str, dataset_id, index_choice, reducer_choice, shape_type, aggregation_period, custom_formula=""):
    """Compute the selected index for every location over the chosen date range.

    For each row of ``locations_df`` (points with latitude/longitude columns, or
    polygons with a ``geometry`` column, depending on ``shape_type``) this
    filters the Earth Engine ``dataset_id`` collection to the ROI and date
    window, aggregates it by ``aggregation_period`` (daily/weekly/monthly/
    yearly), evaluates the index (or ``custom_formula``) per period image, and
    reduces it over the ROI with ``reducer_choice``.

    Parameters
    ----------
    locations_df : pandas.DataFrame
        Input locations; schema depends on ``shape_type``.
    start_date_str, end_date_str : str
        Date-range bounds passed to ``ee.Date``.
    dataset_id : str
        Earth Engine ImageCollection id.
    index_choice : str
        One of the UI options ('NDVI', 'NDWI', 'Average NO₂', 'Custom Formula').
    reducer_choice : str
        Name understood by ``get_reducer`` (mean/sum/median/min/max/count).
    shape_type : str
        'Point' or 'Polygon' (case-insensitive).
    aggregation_period : str
        'Daily', 'Weekly', 'Monthly' or 'Yearly' (case-insensitive).
    custom_formula : str, optional
        Band expression, required when ``index_choice`` is 'Custom Formula'.

    Returns
    -------
    list[dict]
        One record per location/period with the reduced value; points also
        carry 'Latitude'/'Longitude'. Empty on validation failure.
    """
    aggregated_results = []

    # BUG FIX: the UI option is 'Custom Formula', so .lower() yields
    # 'custom formula' (with a space). The previous comparison against
    # 'custom_formula' (underscore) never matched, letting an empty
    # formula through to the EE calls.
    if index_choice.lower() == 'custom formula' and not custom_formula:
        st.error("Custom formula cannot be empty. Please provide a formula.")
        return aggregated_results  # Return early to avoid further processing

    # Map each period to (aggregator helper, image property holding the
    # period timestamp set by that helper).
    period = aggregation_period.lower()
    period_dispatch = {
        'daily': (aggregate_data_daily, 'day'),
        'weekly': (aggregate_data_weekly, 'week'),
        'monthly': (aggregate_data_monthly, 'month'),
        'yearly': (aggregate_data_yearly, 'year'),
    }
    if period not in period_dispatch:
        # Previously an unknown period fell through and later raised a
        # NameError on the unset timestamp; fail loudly instead.
        st.error(f"Unsupported aggregation period: {aggregation_period}")
        return aggregated_results

    # Initialize progress reporting (one step per input row).
    total_steps = len(locations_df)
    progress_bar = st.progress(0)
    progress_text = st.empty()

    def _update_progress(step_idx):
        """Advance the progress bar after finishing row *step_idx*."""
        progress_percentage = (step_idx + 1) / total_steps
        progress_bar.progress(progress_percentage)
        progress_text.markdown(f"Processing: {int(progress_percentage * 100)}%")

    def _process_roi(roi, location_name, extra_fields):
        """Aggregate the dataset over *roi*, appending one record per period image.

        *extra_fields* is merged into each record (e.g. lat/lon for points).
        """
        collection = ee.ImageCollection(dataset_id) \
            .filterDate(ee.Date(start_date_str), ee.Date(end_date_str)) \
            .filterBounds(roi)

        # Aggregate data based on the selected period.
        aggregator, timestamp_prop = period_dispatch[period]
        collection = aggregator(collection)

        # Process each image in the aggregated collection.
        image_list = collection.toList(collection.size())
        for i in range(image_list.size().getInfo()):
            image = ee.Image(image_list.get(i))
            date = ee.Date(image.get(timestamp_prop)).format('YYYY-MM-dd').getInfo()

            # Calculate the index for this period; skip on failure.
            index_image = calculate_index_for_period(image, roi, index_choice, reducer_choice, custom_formula)
            if index_image is None:
                st.warning(f"Index calculation failed for {location_name} on {date}. Skipping this entry.")
                continue

            # Reduce the region to a single aggregated value.
            try:
                index_value = index_image.reduceRegion(
                    reducer=get_reducer(reducer_choice),
                    geometry=roi,
                    scale=30
                ).get(index_image.bandNames().get(0))

                calculated_value = index_value.getInfo()

                # Append only numeric (valid) results.
                if isinstance(calculated_value, (int, float)):
                    record = {'Location Name': location_name}
                    record.update(extra_fields)
                    record['Date'] = date
                    record['Calculated Value'] = calculated_value
                    aggregated_results.append(record)
                else:
                    st.warning(f"Skipping invalid value for {location_name} on {date}")
            except Exception as e:
                st.error(f"Error retrieving value for {location_name}: {e}")

    with st.spinner('Processing data...'):
        if shape_type.lower() == "point":
            for idx, row in locations_df.iterrows():
                # Rows without usable coordinates are skipped, not fatal.
                latitude = row.get('latitude')
                longitude = row.get('longitude')
                if pd.isna(latitude) or pd.isna(longitude):
                    st.warning(f"Skipping location {idx} with missing latitude or longitude")
                    continue

                location_name = row.get('name', f"Location_{idx}")
                roi = ee.Geometry.Point([longitude, latitude])
                _process_roi(roi, location_name, {'Latitude': latitude, 'Longitude': longitude})
                _update_progress(idx)

        elif shape_type.lower() == "polygon":
            for idx, row in locations_df.iterrows():
                polygon_name = row.get('name', f"Polygon_{idx}")

                # Invalid geometries are skipped, not fatal.
                try:
                    roi = convert_to_ee_geometry(row.get('geometry'))
                except ValueError as e:
                    st.warning(f"Skipping invalid polygon {polygon_name}: {e}")
                    continue

                _process_roi(roi, polygon_name, {})
                _update_progress(idx)

    return aggregated_results
565
+
566
# When the user clicks the process button, start the calculation
if st.button(f"Calculate ({index_choice})"):
    if file_upload is not None:

        def _load_locations_df():
            """Read the uploaded file into a DataFrame for the chosen shape type.

            Returns an empty DataFrame on an unsupported format (after showing
            an error), so downstream processing degrades gracefully.
            """
            if shape_type.lower() == "point":
                if file_upload.name.endswith('.csv'):
                    return read_csv(file_upload)
                if file_upload.name.endswith('.geojson'):
                    return read_geojson(file_upload)
                if file_upload.name.endswith('.kml'):
                    return read_kml(file_upload)
                st.error("Unsupported file format. Please upload CSV, GeoJSON, or KML.")
            else:  # polygon
                if file_upload.name.endswith('.geojson'):
                    return read_geojson(file_upload)
                st.error("Please upload a valid GeoJSON file for polygons.")
            # BUG FIX: the polygon branch previously left locations_df unbound
            # on a bad upload, causing a NameError at the process call below.
            return pd.DataFrame()

        def _show_results(results):
            """Render the results table, a CSV download button, and status."""
            if results:
                result_df = pd.DataFrame(results)
                st.write(f"Processed Results Table ({aggregation_period}):")
                st.dataframe(result_df)

                # Provide a download button for the result CSV file.
                # NOTE(review): the '/'-separated dates put slashes in the
                # suggested filename — browsers may sanitize; confirm intent.
                filename = f"{main_selection}_{dataset_id}_{start_date.strftime('%Y/%m/%d')}_{end_date.strftime('%Y/%m/%d')}_{aggregation_period.lower()}.csv"
                st.download_button(
                    label="Download results as CSV",
                    data=result_df.to_csv(index=False).encode('utf-8'),
                    file_name=filename,
                    mime='text/csv'
                )
                # The original also called st.spinner('') here intending to
                # "stop" the spinner; st.spinner is a context manager and that
                # call was a no-op, so it is dropped.
                st.success('Processing complete!')
            else:
                st.warning("No results were generated.")

        locations_df = _load_locations_df()

        # Process results for the selected aggregation period.
        results = process_aggregation(
            locations_df,
            start_date_str,
            end_date_str,
            dataset_id,
            index_choice,
            reducer_choice,
            shape_type,
            aggregation_period,
            custom_formula
        )
        _show_results(results)
    else:
        st.warning("Please upload a file.")