Spaces:

TroglodyteDerivations
/

Meta_Learning_With_HRL_Homer_Simpson_Lecture

Running

App Files Files Community

TroglodyteDerivations committed on about 24 hours ago

Commit

9ff167f

•

1 Parent(s): b288f24

Updated lines 153-189 with: # Display the formulation with parameters plugged in st.write("Last Example in df_0_0 DataFrame 7035 via Method 2:") st.latex(r""" r_{t}^{int} \eta \frac{1}{\sqrt{N(s_{t}) + \epsilon}} = 0.1 \frac{1}{\sqrt{7035 + 1(10^{-5})}} """) # Abstract Base Class for Intrinsic Reward Calculation class IntrinsicRewardCalculator(ABC): @abstractmethod def calculate_intrinsic_reward(self, eta, count, epsilon): pass # Concrete Class for Intrinsic Reward Calculation class ConcreteIntrinsicRewardCalculator(IntrinsicRewardCalculator): def calculate_intrinsic_reward(self, eta, count, epsilon): return eta * (1 / np.sqrt(count + epsilon)) def populate_df_0_0(self, df_0_0, eta, count, epsilon): intrinsic_reward = self.calculate_intrinsic_reward(eta, count, epsilon) df_0_0.at[0, 'Intrinsic Reward'] = intrinsic_reward return df_0_0 # Example 4 parameters eta = 0.1 count = 7035 epsilon = 1e-5 x,y = 0,0 # Create instance for Intrinsic Reward Calculation irc = ConcreteIntrinsicRewardCalculator() intrinsic_reward = irc.calculate_intrinsic_reward(0.1, 7035, 1e-5) st.write(f"Intrinsic Reward @ {count} @ Coordinates {x,y}:", intrinsic_reward) st.write(f"Intrinsic Reward @ {count} @ Coordinates {x,y} rounded 2 decimal places:", np.round(intrinsic_reward,2)) # Populate the DataFrame with the calculated intrinsic reward df_0_0 = irc.populate_df_0_0(df_0_0, eta, count, epsilon) # Display the updated DataFrame st.dataframe(df_0_0[7034:7035])

Browse files

Files changed (1) hide show

app.py +39 -1

app.py CHANGED Viewed

@@ -148,7 +148,45 @@ st.write(f"Calculated intrinsic reward: {r_t_int}")
 st.write(f"Calculated intrinsic reward rounded 4 decimal places:", np.round(r_t_int,4))
 st.dataframe(df_0_0[4:5])
-st.write("Oh, sweet Krusty-licious! At coordinates (0,0) for that plotly visualization, we need a whopping 7035 intrinsic reward calculations to get things rollin'! And don't forget to update those State Visitations. Those were just the first five. Mmm... 7030 more to go... D'oh!")

 st.write(f"Calculated intrinsic reward rounded 4 decimal places:", np.round(r_t_int,4))
 st.dataframe(df_0_0[4:5])
+st.write("Oh, sweet Krusty-licious! At coordinates (0,0) for that plotly visualization, we need a whopping 7036 intrinsic reward calculations to get things rollin'! And don't forget to update those State Visitations. Those were just the first five. Mmm... 7031 more to go... remember the oscillation starts at zero not 1 D'oh!")
+# Display the formulation with parameters plugged in
+st.write("Last Example in df_0_0 DataFrame 7035 via Method 2:")
+st.latex(r"""
+r_{t}^{int} = \eta \frac{1}{\sqrt{N(s_{t}) + \epsilon}} = 0.1 \frac{1}{\sqrt{7035 + 1(10^{-5})}}
+""")
+# Abstract Base Class for Intrinsic Reward Calculation
+class IntrinsicRewardCalculator(ABC):
+    @abstractmethod
+    def calculate_intrinsic_reward(self, eta, count, epsilon):
+        pass
+# Concrete Class for Intrinsic Reward Calculation
+class ConcreteIntrinsicRewardCalculator(IntrinsicRewardCalculator):
+    def calculate_intrinsic_reward(self, eta, count, epsilon):
+        return eta * (1 / np.sqrt(count + epsilon))
+    def populate_df_0_0(self, df_0_0, eta, count, epsilon):
+        intrinsic_reward = self.calculate_intrinsic_reward(eta, count, epsilon)
+        df_0_0.at[0, 'Intrinsic Reward'] = intrinsic_reward
+        return df_0_0
+# Example 4 parameters
+eta = 0.1
+count = 7035
+epsilon = 1e-5
+x,y = 0,0
+# Create instance for Intrinsic Reward Calculation
+irc = ConcreteIntrinsicRewardCalculator()
+intrinsic_reward = irc.calculate_intrinsic_reward(0.1, 7035, 1e-5)
+st.write(f"Intrinsic Reward @ {count} @ Coordinates {x,y}:", intrinsic_reward)
+st.write(f"Intrinsic Reward @ {count} @ Coordinates {x,y} rounded 2 decimal places:", np.round(intrinsic_reward,2))
+# Populate the DataFrame with the calculated intrinsic reward
+df_0_0 = irc.populate_df_0_0(df_0_0, eta, count, epsilon)
+# Display the updated DataFrame
+st.dataframe(df_0_0[7034:7035])