Spaces:

asataura
/

jam_shield_LLM_app

Sleeping

asataura committed on Aug 14, 2023

Commit

6256826

1 Parent(s): 1c2ad5f

Updating DDQN.py

Files changed (1) hide show

DDQN.py CHANGED Viewed

@@ -68,12 +68,13 @@ class DoubleDeepQNetwork:
         # Convert to numpy for speed by vectorization
         x = []
         y = []
-        np_array = np.array(minibatch)
         st = np.zeros((0, self.nS))  # States
         nst = np.zeros((0, self.nS))  # Next States
-        for i in range(len(np_array)):  # Creating the state and next state np arrays
-            st = np.append(st, np_array[i, 0], axis=0)
-            nst = np.append(nst, np_array[i, 3], axis=0)
         st_predict = self.model.predict(st)  # Here is the speedup! I can predict on the ENTIRE batch
         nst_predict = self.model.predict(nst)
         nst_predict_target = self.model_target.predict(nst)  # Predict from the TARGET

         # Convert to numpy for speed by vectorization
         x = []
         y = []
+        np_array = list(minibatch)
         st = np.zeros((0, self.nS))  # States
         nst = np.zeros((0, self.nS))  # Next States
+        for i in range(len(np_array)):
+            st = np.append(st, np_array[i][0], axis=0)
+            nst = np.append(nst, np_array[i][3], axis=0)
         st_predict = self.model.predict(st)  # Here is the speedup! I can predict on the ENTIRE batch
         nst_predict = self.model.predict(nst)
         nst_predict_target = self.model_target.predict(nst)  # Predict from the TARGET