Spaces:

Saving-Willy
/

saving-willy-dev

Running

File size: 13,963 Bytes

828f42d
 
 
 
 
 
 
 
2f87aad
 
828f42d
2f87aad
828f42d
2f87aad
 
828f42d
2f87aad
 
 
 
 
828f42d
2f87aad
 
 
 
 
828f42d
2f87aad
 
828f42d
2f87aad
 
 
828f42d
2f87aad
 
 
 
828f42d
2f87aad
 
828f42d
2f87aad
 
 
828f42d
 
 
2f87aad
 
 
 
 
828f42d
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2f87aad
 
828f42d
 
 
 
 
 
2f87aad
 
828f42d
2f87aad
 
828f42d
2f87aad
 
 
 
 
 
828f42d
 
2f87aad
 
 
 
 
 
 
 
 
828f42d
2f87aad
 
 
 
 
828f42d
2f87aad
 
 
828f42d
 
2f87aad
 
 
 
 
 
 
 
828f42d
 
 
2f87aad
 
 
 
 
 
828f42d
 
2f87aad
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
828f42d
 
 
 
 
 
 
 
 
 
2f87aad
 
 
 
 
 
 
 
 
828f42d
 
2f87aad
 
 
 
 
 
 
 
 
 
 
 
 
828f42d
 
 
 
 
 
 
 
2f87aad
 
 
 
 
 
 
828f42d
 
2f87aad
 
 
 
 
 
 
 
 
828f42d
2f87aad
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
828f42d
2f87aad
 
 
 
 
 
 
828f42d
2f87aad
828f42d
2f87aad
 
 
 
 
828f42d
2f87aad
828f42d
2f87aad
 
 
828f42d
 
2f87aad
 
 
 
 
 
 
 
828f42d
2f87aad
 
 
 
 
 
 
 
 
 
 
 
 
828f42d
 
2f87aad
 
 
 
 
 
 
 
 
 
 
828f42d
2f87aad
828f42d
2f87aad
 
 
828f42d
2f87aad
 
828f42d
 
2f87aad
 
828f42d

import logging
import os

import pandas as pd
import streamlit as st
import folium
from streamlit_folium import st_folium

# from transformers import pipeline
# from transformers import AutoModelForImageClassification

# from maps.obs_map import add_obs_map_header 

# from datasets import disable_caching
# disable_caching()

# import whale_gallery as gallery
# import whale_viewer as viewer
# from input.input_handling import setup_input, check_inputs_are_set
# from input.input_handling import init_input_container_states, add_input_UI_elements, init_input_data_session_states
# from input.input_handling import dbg_show_observation_hashes

# from maps.alps_map import present_alps_map
# from maps.obs_map import present_obs_map
# from utils.st_logs import parse_log_buffer, init_logging_session_states
# from utils.workflow_ui import refresh_progress_display, init_workflow_viz, init_workflow_session_states
# from hf_push_observations import push_all_observations

# from classifier.classifier_image import cetacean_just_classify, cetacean_show_results_and_review, cetacean_show_results, init_classifier_session_states
# from classifier.classifier_hotdog import hotdog_classify


# # setup for the ML model on huggingface (our wrapper)
# os.environ["PROTOCOL_BUFFERS_PYTHON_IMPLEMENTATION"] = "python"
#classifier_revision = '0f9c15e2db4d64e7f622ade518854b488d8d35e6'
# classifier_revision = 'main' # default/latest version
# # and the dataset of observations (hf dataset in our space)
# dataset_id = "Saving-Willy/temp_dataset"
# data_files = "data/train-00000-of-00001.parquet"

# USE_BASIC_MAP = False
# DEV_SIDEBAR_LIB = True

# # one toggle for all the extra debug text
# if "MODE_DEV_STATEFUL" not in st.session_state:
#     st.session_state.MODE_DEV_STATEFUL = False
    

# get a global var for logger accessor in this module
# LOG_LEVEL = logging.DEBUG
# g_logger = logging.getLogger(__name__)
# g_logger.setLevel(LOG_LEVEL)

# st.set_page_config(layout="wide")




def main() -> None:
    """
    Main entry point intended to set up the streamlit UI and run the application.

    NOTE: every statement in the body of this function is currently commented
    out, so calling it has no effect and it simply returns None. The
    description below documents the organisation that the commented-out code
    implements.

    The organisation is as follows:

    1. observation input (new observations) is handled in the sidebar
    2. the rest of the interface is organised in tabs:

        - cetacean classifier
        - hotdog classifier
        - map to present the observations
        - (dev) coordinates tab, a placeholder for picking a location on a map
        - table of recent log entries
        - gallery of whale images

    The majority of the tabs are instantiated from modules. The cetacean
    classifier workflow and the hotdog classifier are still in-line here.

    """

    # g_logger.info("App started.")
    # g_logger.warning(f"[D] Streamlit version: {st.__version__}. Python version: {os.sys.version}")

    #g_logger.debug("debug message")
    #g_logger.info("info message")
    #g_logger.warning("warning message")

    # Streamlit app
    # tab_inference, tab_hotdogs, tab_map, tab_coords, tab_log, tab_gallery = \
    #     st.tabs(["Cetecean classifier", "Hotdog classifier", "Map", "*:gray[Dev:coordinates]*", "Log", "Beautiful cetaceans"])

    # # put this early so the progress indicator is at the top (also refreshed at end)
    # refresh_progress_display()    

    # # create a sidebar, and parse all the input (returned as `observations` object)
    # with st.sidebar:
    #     # layout handling
    #     add_input_UI_elements()
    #     # input elements (file upload, text input, etc)
    #     setup_input()

        
    # with tab_map:
    #     # visual structure: a couple of toggles at the top, then the map including a
    #     # dropdown for tileset selection.
    #     add_obs_map_header()
    #     tab_map_ui_cols = st.columns(2)
    #     with tab_map_ui_cols[0]:
    #         show_db_points = st.toggle("Show Points from DB", True)
    #     with tab_map_ui_cols[1]:
    #         dbg_show_extra = st.toggle("Show Extra points (test)", False)
            
    #     if show_db_points:
    #         # show a nicer map, observations marked, tileset selectable.
    #         st_observation = present_obs_map(
    #             dataset_id=dataset_id, data_files=data_files,
    #             dbg_show_extra=dbg_show_extra)
            
    #     else:
    #         # development map.
    #         st_observation = present_alps_map()
            

    # with tab_log:
    #     handler = st.session_state['handler']
    #     if handler is not None:
    #         records = parse_log_buffer(handler.buffer)
    #         st.dataframe(records[::-1], use_container_width=True,)
    #         st.info(f"Length of records: {len(records)}")
    #     else:
    #         st.error("⚠️ No log handler found!")

        
        
    # with tab_coords:
    #     # the goal of this tab is to allow selection of the new observation's location by map click/adjust.
    #     st.markdown("Coming later! :construction:")
    #     st.markdown(
    #         """*The goal is to allow interactive definition for the coordinates of a new
    #         observation, by click/drag points on the map.*""")
        

    #     st.write("Click on the map to capture a location.")
    #     #m = folium.Map(location=visp_loc, zoom_start=7)
    #     mm = folium.Map(location=[39.949610, -75.150282], zoom_start=16)
    #     folium.Marker( [39.949610, -75.150282], popup="Liberty Bell", tooltip="Liberty Bell"
    # ).add_to(mm)

    #     st_data2 = st_folium(mm, width=725)
    #     st.write("below the map...")
    #     if st_data2['last_clicked'] is not None:
    #         print(st_data2)
    #         st.info(st_data2['last_clicked'])


    # with tab_gallery:
        # # here we make a container to allow filtering css properties 
        # # specific to the gallery (otherwise we get side effects)
        # tg_cont = st.container(key="swgallery")
        # with tg_cont:
        #     gallery.render_whale_gallery(n_cols=4)
        

    # state handling re data_entry phases
    # 0. no data entered yet -> display the file uploader thing
    # 1. we have some images, but not all the metadata fields are done -> validate button shown, disabled
    # 2. all data entered -> validate button enabled
    # 3. validation button pressed, validation done -> enable the inference button. 
    #    - at this point do we also want to disable changes to the metadata selectors?
    #    anyway, simple first. 

    # if st.session_state.workflow_fsm.is_in_state('doing_data_entry'):
    #     # can we advance state? - only when all inputs are set for all uploaded files
    #     all_inputs_set = check_inputs_are_set(debug=True, empty_ok=False)
    #     if all_inputs_set:
    #         st.session_state.workflow_fsm.complete_current_state()
    #         # -> data_entry_complete
    #     else: 
    #         # button, disabled; no state change yet.
    #         st.sidebar.button(":gray[*Validate*]", disabled=True, help="Please fill in all fields.")
            
    
    # if st.session_state.workflow_fsm.is_in_state('data_entry_complete'):
    #     # can we advance state? - only when the validate button is pressed
    #     if st.sidebar.button(":white_check_mark:[**Validate**]"):
    #         # create a dictionary with the submitted observation
    #         tab_log.info(f"{st.session_state.observations}")
    #         df = pd.DataFrame([obs.to_dict() for obs in st.session_state.observations.values()])
    #         #df = pd.DataFrame(st.session_state.observations, index=[0])
    #         with tab_coords:
    #             st.table(df)
    #         # there doesn't seem to be any actual validation here?? TODO: find validator function (each element is validated by the input box, but is there something at the whole image level?)
    #         # hmm, maybe it should actually just be "I'm done with data entry"
    #         st.session_state.workflow_fsm.complete_current_state()
    #         # -> data_entry_validated
    
    # state handling re inference phases (tab_inference)
    # 3. validation button pressed, validation done -> enable the inference button.
    # 4. inference button pressed -> ML started. | let's cut this one out, since it would only
    #      make sense if we did it as an async action
    # 5. ML done -> show results, and manual validation options
    # 6. manual validation done -> enable the upload buttons
    # 
    # with tab_inference:
    #     # inside the inference tab, on button press we call the model (on huggingface hub)
    #     # which will be run locally. 
    #     # - the model predicts the top 3 most likely species from the input image
    #     # - these species are shown
    #     # - the user can override the species prediction using the dropdown 
    #     # - an observation is uploaded if the user chooses.

        
    #     if st.session_state.MODE_DEV_STATEFUL:
    #         dbg_show_observation_hashes()

    #     add_classifier_header()
    #     # if we are before data_entry_validated, show the button, disabled.
    #     if not st.session_state.workflow_fsm.is_in_state_or_beyond('data_entry_validated'):
    #         tab_inference.button(":gray[*Identify with cetacean classifier*]", disabled=True, 
    #                             help="Please validate inputs before proceeding", 
    #                             key="button_infer_ceteans")
        
    #     if st.session_state.workflow_fsm.is_in_state('data_entry_validated'):
    #         # show the button, enabled. If pressed, we start the ML model (And advance state)
    #         if tab_inference.button("Identify with cetacean classifier", 
    #                                 key="button_infer_ceteans"):
    #             cetacean_classifier = AutoModelForImageClassification.from_pretrained(
    #                 "Saving-Willy/cetacean-classifier", 
    #                 revision=classifier_revision, 
    #                 trust_remote_code=True)

    #             cetacean_just_classify(cetacean_classifier)
    #             st.session_state.workflow_fsm.complete_current_state()
    #             # trigger a refresh too (refreshing the progress indicator means the script reruns and
    #             # we can enter the next state - visualising the results / review)
    #             # ok, it doesn't if done programmatically. maybe interacting with the button? check docs.
    #             refresh_progress_display()
    #             #TODO: validate this doesn't harm performance adversely.
    #             st.rerun()
        
    #     elif st.session_state.workflow_fsm.is_in_state('ml_classification_completed'):
    #         # show the results, and allow manual validation
    #         st.markdown("""### Inference results and manual validation/adjustment """)
    #         if st.session_state.MODE_DEV_STATEFUL:
    #             s = ""
    #             for k, v in st.session_state.whale_prediction1.items():
    #                 s += f"* Image {k}: {v}\n"
                    
    #             st.markdown(s)

    #         # add a button to advance the state
    #         if st.button("Confirm species predictions", help="Confirm that all species are selected correctly"):
    #             st.session_state.workflow_fsm.complete_current_state()
    #             # -> manual_inspection_completed
    #             st.rerun()
            
    #         cetacean_show_results_and_review()

    #     elif st.session_state.workflow_fsm.is_in_state('manual_inspection_completed'):
    #         # show the ML results, and allow the user to upload the observation
    #         st.markdown("""### Inference Results (after manual validation) """)
            
            
    #         if st.button("Upload all observations to THE INTERNET!"):
    #             # let this go through to the push_all func, since it just reports to log for now.
    #             push_all_observations(enable_push=False)
    #             st.session_state.workflow_fsm.complete_current_state()
    #             # -> data_uploaded
    #             st.rerun()

    #         cetacean_show_results()
        
    #     elif st.session_state.workflow_fsm.is_in_state('data_uploaded'):
    #         # the data has been sent. Lets show the observations again
    #         # but no buttons to upload (or greyed out ok)
    #         st.markdown("""### Observation(s) uploaded - thank you!""")
    #         cetacean_show_results()

    #         st.divider()
    #         #df = pd.DataFrame(st.session_state.observations, index=[0])
    #         df = pd.DataFrame([obs.to_dict() for obs in st.session_state.observations.values()])
    #         st.table(df)

    #         # didn't decide what the next state is here - I think we are in the terminal state.
    #         #st.session_state.workflow_fsm.complete_current_state()
            
        
    # # inside the hotdog tab, on button press we call a 2nd model (totally unrelated at present, just for demo
    # # purposes, a hotdog image classifier) which will be run locally.
    # # - this model predicts if the image is a hotdog or not, and returns probabilities
    # # - the input image is the same as for the cetacean classifier - defined in the sidebar
    # tab_hotdogs.title("Hot Dog? Or Not?")
    # tab_hotdogs.write("""
    #             *Run alternative classifer on input images. Here we are using
    #             a binary classifier - hotdog or not - from
    #             huggingface.co/julien-c/hotdog-not-hotdog.*""")

    # if tab_hotdogs.button("Get Hotdog Prediction"):   
        
    #     pipeline_hot_dog = pipeline(task="image-classification", model="julien-c/hotdog-not-hotdog")

    #     if st.session_state.image is None:
    #         st.info("Please upload an image first.")
    #         #st.info(str(observations.to_dict()))
            
    #     else:
    #         hotdog_classify(pipeline_hot_dog, tab_hotdogs)
            
            
    # # after all other processing, we can show the stage/state
    # refresh_progress_display()


# Invoke main() only when this file is executed as the top-level script,
# not when it is imported as a module.
if __name__ == "__main__":
    main()