Spaces:

Bestever
/

st_report_2

Runtime error

App Files Files Community

bestpedro committed on Mar 26, 2024

Commit

c74c3b3

verified ·

1 Parent(s): e4b374c

Update app.py

Browse files

Files changed (1) hide show

app.py +155 -28

app.py CHANGED Viewed

@@ -14,20 +14,16 @@ import os
 from openai import AzureOpenAI
 import base64
-# st.page_link("report.py", label="Home", icon="🏠")
-# st.page_link("pages/page_1.py", label="Page 1", icon="1️⃣")
-# st.page_link("pages/page_2.py", label="Page 2", icon="2️⃣", disabled=True)
 ACCOUNT_ID = "act_416207949073936"
 PAGE_ID = "63257509478"
 OPENAI_API = os.getenv("OPENAI_API")
 ACCESS_TOKEN = os.getenv("ACCESS_TOKEN")
 BIG_DATASET = None
-print(ACCESS_TOKEN)
 ANALYSIS_TYPE = {
     "OUTCOME_SALES": "ROAS",
 }
 API_BASE = 'https://bestever-vision.openai.azure.com/'
@@ -112,7 +108,7 @@ def get_ads(adset_id):
     url = f"{adset_id}/insights"
     params = {
         "date_preset": "last_90d",
-        "fields": "ad_name,ad_id,impressions,spend,video_play_actions,video_p25_watched_actions,video_p50_watched_actions,video_p75_watched_actions,video_p100_watched_actions,video_play_curve_actions,purchase_roas",
         "breakdowns": "age,gender",
         "limit": 1000,
         "level": "ad",
@@ -130,6 +126,48 @@ def save_image_from_url(url, filename):
         return True
     return False
 def get_creative_assets(ad_id):
     # checking if the asset already exists
     if os.path.exists(f'assets/{ad_id}.png') or os.path.exists(f'assets/{ad_id}.mp4') or os.path.exists(f'assets/{ad_id}.jpg'):
@@ -141,7 +179,6 @@ def get_creative_assets(ad_id):
     }
     creative = call_graph_api(url, params)["creative"]
     saved = False
-    print("-" * 10)
     if "video_id" in creative:
         # download video
         video_id = creative["video_id"]
@@ -155,6 +192,7 @@ def get_creative_assets(ad_id):
         if len(ext) > 4:
             ext = "mp4"
         saved = save_image_from_url(video_source, os.path.join("assets", f'{ad_id}.{ext}'))
     elif "image_url" in creative:
         image_url = creative["image_url"]
@@ -178,6 +216,7 @@ def get_creative_assets(ad_id):
                 if len(ext) > 4:
                     ext = "png"
                 saved = save_image_from_url(video_url, os.path.join("assets", f'{ad_id}.{ext}'))
             elif "image" in media:
                 image_url = media["image"]["src"]
                 ext = image_url.split("?")[0].split(".")[-1]
@@ -212,22 +251,34 @@ def top_n_ads(df, n=5):
         if os.path.exists(f'assets/{ad_id}.png'):
             image_paths.append(f'assets/{ad_id}.png')
         elif os.path.exists(f'assets/{ad_id}.mp4'):
-            image_paths.append(f'assets/{ad_id}.mp4')
         elif os.path.exists(f'assets/{ad_id}.jpg'):
             image_paths.append(f'assets/{ad_id}.jpg')
     return image_paths
-def perform_analysis(df, objective):
     # - TS to CTR ratio analysis
-    # - ROAS analysis (I will see the better metric here to use)
     # - Video drop off analysis
     if ANALYSIS_TYPE[objective] == "ROAS":
-        # 3 analysis:
-        # general
-        # male
-        # female
         df_general = df.groupby(["ad_id"]).sum()
         df_general = df_general.reset_index()
         df_general["relative_roas"] = df_general["purchase_roas"] / df_general["spend"]
@@ -277,6 +328,53 @@ def perform_analysis(df, objective):
             "Female": female_output,
         }
 def format_adsets(campaign_id):
     st_campaigns.empty()
     adsets = get_adsets(campaign_id)
@@ -308,23 +406,40 @@ def format_ads(adset_id):
     for col in video_cols:
         if col in df_ads.columns:
             df_ads[col] = df_ads[col].apply(lambda x: float(x[0].get("value", 0)) if isinstance(x, list) else 0)
     if "purchase_roas" in df_ads.columns:
         df_ads["purchase_roas"] = df_ads["purchase_roas"].apply(lambda x: float(x[0].get("value", 0)) if isinstance(x, list) else 0)
     if BIG_DATASET is None:
         BIG_DATASET = df_ads
     else:
         BIG_DATASET = pd.concat([BIG_DATASET, df_ads])
-    BIG_DATASET.to_csv("big_dataset.csv")
     with st_ads.container():
         with st.expander("See analysis", expanded=False):
             analysis = st.empty()
         for i, ad in enumerate(df_ads["ad_id"].unique()):
             get_creative_assets(ad)
             ad_name = df_ads[df_ads["ad_id"] == ad]["ad_name"].values[0]
-            with st.popover(ad_name):
                 tab1, tab2, tab3 = st.tabs(["Creative", "Analytics", "Video Analysis"])
                 df_tmp = df_ads[df_ads["ad_id"] == ad]
                 with tab2:
@@ -363,7 +478,6 @@ def format_ads(adset_id):
                     if "purchase_roas" in df_tmp.columns:
                         df_roas = df_tmp.groupby(options)[["spend","purchase_roas"]].sum().reset_index().sort_values("purchase_roas", ascending=False)
-                        print(df_roas)
                         values = [str(v) for v in df_tmp[options].values]
                         fig = go.Figure(data=[
                             go.Bar(name='ROAS', x=values, y=df_roas["purchase_roas"]),
@@ -377,7 +491,6 @@ def format_ads(adset_id):
                     if "video_play_actions" in df_tmp.columns:
                         values = df_ads[["ad_id","video_play_actions","video_p25_watched_actions","video_p50_watched_actions","video_p75_watched_actions","video_p100_watched_actions"]].groupby("ad_id").get_group(ad).sum().values[1:]
                         labels = ["Total video plays","Video plays until 25%","Video plays until 50%","Video plays until 75%","Video plays until 100%"]
-                        print(values)
                         if values[0] > 0:
                             st.plotly_chart(create_video_plays_funnel(values, labels), use_container_width=True)
                 with tab1:
@@ -389,13 +502,27 @@ def format_ads(adset_id):
                         st.image(f'assets/{ad}.jpg', caption='Creative', use_column_width=True)
         with analysis.container():
-            report = perform_analysis(df_tmp, "OUTCOME_SALES")
-            tabs = st.tabs(report.keys())
-            tabs_names = list(report.keys())
-            for i, tab in enumerate(tabs):
-                with tab:
-                    st.multiselect("", report[tabs_names[i]]["keywords"], report[tabs_names[i]]["keywords"], key=f"{ad}_{i}")
-                    st.write(report[tabs_names[i]]["insights"])
 def create_video_plays_funnel(funnel_data, funnel_title):
     fig = go.Figure(go.Funnel(
@@ -413,7 +540,6 @@ if not st.session_state["initiated"]:
     st.session_state["initiated"] = True
     with st_campaigns.container():
         st.title("Campaigns")
-        print(get_campaigns(ACCOUNT_ID))
         for c in (get_campaigns(ACCOUNT_ID))["data"]:
             with st.popover(c["campaign_name"]):
                 st.markdown("**Impressions**: " + str(c["impressions"]))
@@ -425,3 +551,4 @@ if not st.session_state["initiated"]:
                     on_click=format_adsets,
                     kwargs={"campaign_id": c["campaign_id"]},
                 )

 from openai import AzureOpenAI
 import base64
 ACCOUNT_ID = "act_416207949073936"
 PAGE_ID = "63257509478"
 OPENAI_API = os.getenv("OPENAI_API")
 ACCESS_TOKEN = os.getenv("ACCESS_TOKEN")
 BIG_DATASET = None
 ANALYSIS_TYPE = {
     "OUTCOME_SALES": "ROAS",
+    "OUTCOME_AWARENESS": "ENGAGEMENT",
+    "OUTCOME_LEADS": "ENGAGEMENT"
 }
 API_BASE = 'https://bestever-vision.openai.azure.com/'
     url = f"{adset_id}/insights"
     params = {
         "date_preset": "last_90d",
+        "fields": "ad_name,ad_id,impressions,spend,video_play_actions,video_p25_watched_actions,video_p50_watched_actions,video_p75_watched_actions,video_p100_watched_actions,video_play_curve_actions,purchase_roas,cost_per_action_type,objective",
         "breakdowns": "age,gender",
         "limit": 1000,
         "level": "ad",
         return True
     return False
+def extract_specific_frame(video_path, frame_position, output_image):
+    # Open the video file
+    cap = cv2.VideoCapture(video_path)
+    if not cap.isOpened():
+        print("Error opening video file")
+        return
+    # Get the total number of frames
+    total_frames = int(cap.get(cv2.CAP_PROP_FRAME_COUNT))
+    # Calculate the frame index based on the position
+    if frame_position == 'middle':
+        frame_index = total_frames // 2
+    elif frame_position == 'last':
+        frame_index = total_frames - 1
+    else:  # 'first' or any other input defaults to the first frame
+        frame_index = 0
+    # Set the current frame position
+    cap.set(cv2.CAP_PROP_POS_FRAMES, frame_index)
+    # Read the frame
+    ret, frame = cap.read()
+    if ret:
+        frame = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
+        frame = Image.fromarray(frame)
+        frame.save(output_image, "JPEG")
+    else:
+        print(f"Error reading the {frame_position} frame")
+    # Release the video capture object
+    cap.release()
+def split_video_in_frames(video_path):
+    output_path = video_path.split(".")[0]
+    extract_specific_frame(video_path, 'first', output_path + "_first.jpg")
+    extract_specific_frame(video_path, 'middle', output_path + "_middle.jpg")
+    extract_specific_frame(video_path, 'last', output_path + "_last.jpg")
 def get_creative_assets(ad_id):
     # checking if the asset already exists
     if os.path.exists(f'assets/{ad_id}.png') or os.path.exists(f'assets/{ad_id}.mp4') or os.path.exists(f'assets/{ad_id}.jpg'):
     }
     creative = call_graph_api(url, params)["creative"]
     saved = False
     if "video_id" in creative:
         # download video
         video_id = creative["video_id"]
         if len(ext) > 4:
             ext = "mp4"
         saved = save_image_from_url(video_source, os.path.join("assets", f'{ad_id}.{ext}'))
+        split_video_in_frames(os.path.join("assets", f'{ad_id}.{ext}'))
     elif "image_url" in creative:
         image_url = creative["image_url"]
                 if len(ext) > 4:
                     ext = "png"
                 saved = save_image_from_url(video_url, os.path.join("assets", f'{ad_id}.{ext}'))
+                split_video_in_frames(os.path.join("assets", f'{ad_id}.{ext}'))
             elif "image" in media:
                 image_url = media["image"]["src"]
                 ext = image_url.split("?")[0].split(".")[-1]
         if os.path.exists(f'assets/{ad_id}.png'):
             image_paths.append(f'assets/{ad_id}.png')
         elif os.path.exists(f'assets/{ad_id}.mp4'):
+            image_paths.append(f'assets/{ad_id}_first.jpg')
         elif os.path.exists(f'assets/{ad_id}.jpg'):
             image_paths.append(f'assets/{ad_id}.jpg')
     return image_paths
+def video_dropoff_analysis(df):
+    if "video_play_actions" not in df.columns:
+        return "There is not enough data to generate insights about video dropoff."
+    df_general = df.groupby(["ad_id"]).sum()
+    df_general = df_general.reset_index()
+    df_general = df_general[df_general["video_play_actions"] > 0]
+    if df_general.shape[0] < 2:
+        return "There is not enough data to generate insights about video dropoff."
+    df_general["p100"] = df_general["video_p100_watched_actions"] / df_general["video_play_actions"]
+    df_general = df_general.sort_values("p100", ascending=False)
+    image_paths = top_n_ads(df_general)
+    image_paths = [path for path in image_paths if path.endswith(".mp4")]
+    response = call_gpt_vision(client, image_paths, f"You are given a set of the most performative videos. Your task is to evaluate and anylise these videos, getting features like type of shoot, lightinig, colors, motion, etc, and generate a paragraph explaning what makes a good video. I will also provide a list of video plays in different stages of the video. The main idea is to understand what makes people spend more time on the video. Please, try to be technical and generate insights that can be use to future videos. Dropoff stages: 25%, 50%, 75%, 100%. Dataset: {df.head(5)}")
+    return response.choices[0].message.content
+def performance_analysis(df, objective):
     # - TS to CTR ratio analysis
     # - Video drop off analysis
     if ANALYSIS_TYPE[objective] == "ROAS":
         df_general = df.groupby(["ad_id"]).sum()
         df_general = df_general.reset_index()
         df_general["relative_roas"] = df_general["purchase_roas"] / df_general["spend"]
             "Female": female_output,
         }
+    elif ANALYSIS_TYPE[objective] == "ENGAGEMENT":
+        df_general = df.groupby(["ad_id"]).sum()
+        df_general = df_general.reset_index()
+        df_general = df_general.sort_values("cost_per_engagement", ascending=True)
+        image_paths = top_n_ads(df_general)
+        response = call_gpt_vision(client, image_paths, "You are a marketing analyst and your task is to find common features between the ads that presented more engagement. You are given the top 5 most perfomative ads, and we expect you to return 5 keywords and its explanation that defines what makes a good ad that show an excellent engagement. Return it as a list of 5 concepts and its explanation, using the provided ads as example. Try to use nice categories to describe the features (you can use some names like `minimalist design`, `Clear message`, etc). Also, pay attention if the ads are mostly images or videos, this is important to say. The output MUST contain one concept per line. For each like, follow the structure: <concept>:<explanation>.")
+        image_winner_concepts = parse_tags_from_content(response)
+        response = call_gpt_vision(client, [], f"Following, you have the key features that makes an ad a performative ad. Your task is to group this information and summarize in a nice paragraph that will be presented to the marketing team. Be concise. Features:\n{image_winner_concepts}")
+        insights = response.choices[0].message.content
+        general_output = {"keywords": [concept["name"] for concept in image_winner_concepts], "insights": insights}
+        # Groupby ad_id and gender
+        df_male = df[df["gender"] == "male"].groupby(["ad_id"]).sum()
+        df_male = df_male.reset_index()
+        df_male = df_male.sort_values("cost_per_engagement", ascending=True)
+        image_paths = top_n_ads(df_male)
+        response = call_gpt_vision(client, image_paths, "You are a marketing analyst and your task is to find common features between the ads that presented more engagement from men. You are given the top 5 most perfomative ads, and we expect you to return 5 keywords and its explanation that defines what makes a good ad that show an excellent engagement. Return it as a list of 5 concepts and its explanation, using the provided ads as example. Try to use nice categories to describe the features (you can use some names like `minimalist design`, `Clear message`, etc). Also, pay attention if the ads are mostly images or videos, this is important to say. The output MUST contain one concept per line. For each like, follow the structure: <concept>:<explanation>.")
+        image_winner_concepts = parse_tags_from_content(response)
+        response = call_gpt_vision(client, [], f"Following, you have the key features that makes an ad a performative ad. Your task is to group this information and summarize in a nice paragraph that will be presented to the marketing team. Be concise. Features:\n{image_winner_concepts}")
+        insights = response.choices[0].message.content
+        male_output = {"keywords": [concept["name"] for concept in image_winner_concepts], "insights": insights}
+        df_female = df[df["gender"] == "female"].groupby(["ad_id"]).sum()
+        df_female = df_female.reset_index()
+        df_female = df_female.sort_values("cost_per_engagement", ascending=True)
+        image_paths = top_n_ads(df_female)
+        response = call_gpt_vision(client, image_paths, "You are a marketing analyst and your task is to find common features between the ads that presented more engagement from women. You are given the top 5 most perfomative ads, and we expect you to return 5 keywords and its explanation that defines what makes a good ad that show an excellent engagement. Return it as a list of 5 concepts and its explanation, using the provided ads as example. Try to use nice categories to describe the features (you can use some names like `minimalist design`, `Clear message`, etc). Also, pay attention if the ads are mostly images or videos, this is important to say. The output MUST contain one concept per line. For each like, follow the structure: <concept>:<explanation>.")
+        image_winner_concepts = parse_tags_from_content(response)
+        response = call_gpt_vision(client, [], f"Following, you have the key features that makes an ad a performative ad. Your task is to group this information and summarize in a nice paragraph that will be presented to the marketing team. Be concise. Features:\n{image_winner_concepts}")
+        insights = response.choices[0].message.content
+        female_output = {"keywords": [concept["name"] for concept in image_winner_concepts], "insights": insights}
+        return {
+            "General": general_output,
+            "Male":  male_output,
+            "Female": female_output,
+        }
 def format_adsets(campaign_id):
     st_campaigns.empty()
     adsets = get_adsets(campaign_id)
     for col in video_cols:
         if col in df_ads.columns:
             df_ads[col] = df_ads[col].apply(lambda x: float(x[0].get("value", 0)) if isinstance(x, list) else 0)
+    objective = df_ads["objective"].values[0]
+    def get_engagement(row):
+        if isinstance(row, list):
+            for ac in row:
+                if ac["action_type"] == "post_engagement":
+                    return float(ac["value"])
+        return 0
+    if "cost_per_action_type" in df_ads.columns:
+        df_ads["cost_per_engagement"] = df_ads["cost_per_action_type"].apply(get_engagement)
+        df_ads = df_ads.sort_values("cost_per_engagement", ascending=True)
     if "purchase_roas" in df_ads.columns:
         df_ads["purchase_roas"] = df_ads["purchase_roas"].apply(lambda x: float(x[0].get("value", 0)) if isinstance(x, list) else 0)
+        df_ads["r_purchase_roas"] = df_ads["purchase_roas"] / df_ads["spend"]
+        df_ads = df_ads.sort_values("r_purchase_roas", ascending=False)
     if BIG_DATASET is None:
         BIG_DATASET = df_ads
     else:
         BIG_DATASET = pd.concat([BIG_DATASET, df_ads])
     with st_ads.container():
+        st.title("Ads")
         with st.expander("See analysis", expanded=False):
             analysis = st.empty()
         for i, ad in enumerate(df_ads["ad_id"].unique()):
             get_creative_assets(ad)
             ad_name = df_ads[df_ads["ad_id"] == ad]["ad_name"].values[0]
+            if i < 3:
+                addon = "🏆"
+            else:
+                addon = ""
+            with st.popover(f"{addon} {ad_name}"):
                 tab1, tab2, tab3 = st.tabs(["Creative", "Analytics", "Video Analysis"])
                 df_tmp = df_ads[df_ads["ad_id"] == ad]
                 with tab2:
                     if "purchase_roas" in df_tmp.columns:
                         df_roas = df_tmp.groupby(options)[["spend","purchase_roas"]].sum().reset_index().sort_values("purchase_roas", ascending=False)
                         values = [str(v) for v in df_tmp[options].values]
                         fig = go.Figure(data=[
                             go.Bar(name='ROAS', x=values, y=df_roas["purchase_roas"]),
                     if "video_play_actions" in df_tmp.columns:
                         values = df_ads[["ad_id","video_play_actions","video_p25_watched_actions","video_p50_watched_actions","video_p75_watched_actions","video_p100_watched_actions"]].groupby("ad_id").get_group(ad).sum().values[1:]
                         labels = ["Total video plays","Video plays until 25%","Video plays until 50%","Video plays until 75%","Video plays until 100%"]
                         if values[0] > 0:
                             st.plotly_chart(create_video_plays_funnel(values, labels), use_container_width=True)
                 with tab1:
                         st.image(f'assets/{ad}.jpg', caption='Creative', use_column_width=True)
         with analysis.container():
+            v_d, p_a = st.tabs(["Video Dropoff", "Performance Analysis"])
+            with p_a:
+                if not os.path.exists(f"{adset_id}_performance.json"):
+                    report = performance_analysis(df_ads, objective)
+                    json.dump(report, open(f"{adset_id}_performance.json", "w"))
+                else:
+                    report = json.load(open(f"{adset_id}_performance.json", "r"))
+                tabs = st.tabs(report.keys())
+                tabs_names = list(report.keys())
+                for i, tab in enumerate(tabs):
+                    with tab:
+                        st.multiselect("", report[tabs_names[i]]["keywords"], report[tabs_names[i]]["keywords"], key=f"{ad}_{i}")
+                        st.write(report[tabs_names[i]]["insights"])
+            with v_d:
+                if not os.path.exists(f"{adset_id}_video_dropoff.json"):
+                    report = video_dropoff_analysis(df_ads)
+                    json.dump(report, open(f"{adset_id}_video_dropoff.json", "w"))
+                else:
+                    report = json.load(open(f"{adset_id}_video_dropoff.json", "r"))
+                st.write(report)
 def create_video_plays_funnel(funnel_data, funnel_title):
     fig = go.Figure(go.Funnel(
     st.session_state["initiated"] = True
     with st_campaigns.container():
         st.title("Campaigns")
         for c in (get_campaigns(ACCOUNT_ID))["data"]:
             with st.popover(c["campaign_name"]):
                 st.markdown("**Impressions**: " + str(c["impressions"]))
                     on_click=format_adsets,
                     kwargs={"campaign_id": c["campaign_id"]},
                 )