Spaces:

distributed
/

model_convergence

Sleeping

kmfoda committed on Sep 17, 2024

Commit

ad3f254

1 Parent(s): b1ca382

Update to reflect correct model

Files changed (2) hide show

evaluate.py CHANGED Viewed

@@ -9,7 +9,7 @@ import json
 device = "cuda"
 test_indices_length = 10
-models = ["distributed/optimized-gpt2-250m", "distributed/gpt2-250m"]
 with open('results.json', 'r') as file:
     results = json.load(file)
@@ -79,14 +79,5 @@ for model_name in models:
         results[model_name][str(epoch)] = [average_loss]
         print(f"Epoch: {epoch}  Average Loss: {average_loss:.2f}")
-with open("results.json", "w") as outfile:
-    json.dump(results, outfile, indent = 4)
-# for model_name in models:
-#     plt.plot(results[model_name].keys(), results[model_name].values())
-#     plt.title(f"{model_name} Convergence Over Time")
-#     plt.xlabel("Steps")
-#     plt.ylabel("Loss")
-#     plt.xticks(fontsize=3.5)
-#     plt.savefig(f"{model_name.split('/')[1]}_results.png")

 device = "cuda"
 test_indices_length = 10
+models = ["distributed/optimized-gpt2-250m", "distributed/gpt2-94m"]
 with open('results.json', 'r') as file:
     results = json.load(file)
         results[model_name][str(epoch)] = [average_loss]
         print(f"Epoch: {epoch}  Average Loss: {average_loss:.2f}")
+with open("results.json", "w") as outfile:
+    json.dump(results, outfile, indent = 4)

results.json CHANGED Viewed

@@ -931,7 +931,7 @@
             6.409368515014648
         ]
     },
-    "distributed/gpt2-250m": {
         "0": [
             10.942681312561035
         ],

             6.409368515014648
         ]
     },
+    "distributed/gpt2-94m": {
         "0": [
             10.942681312561035
         ],