Spaces:

asataura
/

jam_shield_LLM_app

Sleeping

App Files Community

asataura committed on Aug 14, 2023

Commit

6c2cfa4

1 Parent(s): c9e0f93

Updating DDQN

Browse files

Files changed (2) hide show

DDQN.py +7 -8
tester.py +0 -1

DDQN.py CHANGED Viewed

@@ -9,10 +9,9 @@ import random
 class DoubleDeepQNetwork:
-    def __init__(self, states, actions, history, alpha, gamma, epsilon, epsilon_min, epsilon_decay):
-        self.nS = states
-        self.nA = actions
-        self.history = history
         self.memory = deque([], maxlen=2500)
         self.alpha = alpha
         self.gamma = gamma
@@ -27,7 +26,7 @@ class DoubleDeepQNetwork:
     def build_model(self):
         model = keras.Sequential()  # linear stack of layers https://keras.io/models/sequential/
-        model.add(keras.layers.Dense(24, input_dim=self.history * self.nS, activation='relu'))  # [Input] -> Layer 1
         model.add(keras.layers.Dense(24, activation='relu'))  # Layer 2 -> 3
         model.add(keras.layers.Dense(self.nA, activation='linear'))  # Layer 3 -> [output]
@@ -69,8 +68,8 @@ class DoubleDeepQNetwork:
         x = []
         y = []
         np_array = np.array(minibatch)
-        st = np.zeros((0, self.history*self.nS))  # States
-        nst = np.zeros((0, self.history*self.nS))  # Next States
         for i in range(len(np_array)):  # Creating the state and next state np arrays
             st = np.append(st, np_array[i, 0], axis=0)
             nst = np.append(nst, np_array[i, 3], axis=0)
@@ -93,7 +92,7 @@ class DoubleDeepQNetwork:
             y.append(target_f)
             index += 1
         # Reshape for Keras Fit
-        x_reshape = np.array(x).reshape(batch_size, self.history * self.nS)
         y_reshape = np.array(y)
         epoch_count = 1
         hist = self.model.fit(x_reshape, y_reshape, epochs=epoch_count, verbose=0)

 class DoubleDeepQNetwork:
+    def __init__(self, s_size, a_size, alpha, gamma, epsilon, epsilon_min, epsilon_decay):
+        self.nS = s_size
+        self.nA = a_size
         self.memory = deque([], maxlen=2500)
         self.alpha = alpha
         self.gamma = gamma
     def build_model(self):
         model = keras.Sequential()  # linear stack of layers https://keras.io/models/sequential/
+        model.add(keras.layers.Dense(24, input_dim=self.nS, activation='relu'))  # [Input] -> Layer 1
         model.add(keras.layers.Dense(24, activation='relu'))  # Layer 2 -> 3
         model.add(keras.layers.Dense(self.nA, activation='linear'))  # Layer 3 -> [output]
         x = []
         y = []
         np_array = np.array(minibatch)
+        st = np.zeros((0, self.nS))  # States
+        nst = np.zeros((0, self.nS))  # Next States
         for i in range(len(np_array)):  # Creating the state and next state np arrays
             st = np.append(st, np_array[i, 0], axis=0)
             nst = np.append(nst, np_array[i, 3], axis=0)
             y.append(target_f)
             index += 1
         # Reshape for Keras Fit
+        x_reshape = np.array(x).reshape(batch_size, self.nS)
         y_reshape = np.array(y)
         epoch_count = 1
         hist = self.model.fit(x_reshape, y_reshape, epochs=epoch_count, verbose=0)

tester.py CHANGED Viewed

@@ -27,7 +27,6 @@ def test(jammer_type, channel_switching_cost):
     epsilon_decay = 0.999
     discount_rate = 0.95
     lr = 0.001
-    batch_size = 32
     agentName = f'savedAgents/DDQNAgent_{jammer_type}_csc_{channel_switching_cost}'
     DDQN_agent = DoubleDeepQNetwork(s_size, a_size, lr, discount_rate, epsilon, epsilon_min, epsilon_decay)

     epsilon_decay = 0.999
     discount_rate = 0.95
     lr = 0.001
     agentName = f'savedAgents/DDQNAgent_{jammer_type}_csc_{channel_switching_cost}'
     DDQN_agent = DoubleDeepQNetwork(s_size, a_size, lr, discount_rate, epsilon, epsilon_min, epsilon_decay)