Spaces:
Sleeping
Sleeping
Update results
Browse files
- evaluate.py +3 -3
- results.json +63 -1
evaluate.py
CHANGED
|
@@ -9,7 +9,7 @@ import json
|
|
| 9 |
device = "cuda"
|
| 10 |
test_indices_length = 10
|
| 11 |
|
| 12 |
-
models = ["distributed/optimized-gpt2-250m", "distributed/gpt2-94m"]
|
| 13 |
|
| 14 |
with open('results.json', 'r') as file:
|
| 15 |
results = json.load(file)
|
|
@@ -79,5 +79,5 @@ for model_name in models:
|
|
| 79 |
results[model_name][str(epoch)] = [average_loss]
|
| 80 |
print(f"Epoch: {epoch} Average Loss: {average_loss:.2f}")
|
| 81 |
|
| 82 |
-
with open("results.json", "w") as outfile:
|
| 83 |
-
|
|
|
|
| 9 |
device = "cuda"
|
| 10 |
test_indices_length = 10
|
| 11 |
|
| 12 |
+
models = ["distributed/optimized-gpt2-250m", "distributed/optimized-gpt2-250m-v0.1.1", "distributed/gpt2-94m"]
|
| 13 |
|
| 14 |
with open('results.json', 'r') as file:
|
| 15 |
results = json.load(file)
|
|
|
|
| 79 |
results[model_name][str(epoch)] = [average_loss]
|
| 80 |
print(f"Epoch: {epoch} Average Loss: {average_loss:.2f}")
|
| 81 |
|
| 82 |
+
with open("results.json", "w") as outfile:
|
| 83 |
+
json.dump(results, outfile, indent = 4)
|
results.json
CHANGED
|
@@ -1,5 +1,5 @@
|
|
| 1 |
{
|
| 2 |
-
"distributed/optimized-gpt2-250m": {
|
| 3 |
"0": [
|
| 4 |
11.042416954040528
|
| 5 |
],
|
|
@@ -1703,5 +1703,67 @@
|
|
| 1703 |
"256": [
|
| 1704 |
7.2350592613220215
|
| 1705 |
]
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1706 |
}
|
| 1707 |
}
|
|
|
|
| 1 |
{
|
| 2 |
+
"distributed/optimized-gpt2-250m-v0.1.1": {
|
| 3 |
"0": [
|
| 4 |
11.042416954040528
|
| 5 |
],
|
|
|
|
| 1703 |
"256": [
|
| 1704 |
7.2350592613220215
|
| 1705 |
]
|
| 1706 |
+
},
|
| 1707 |
+
"distributed/optimized-gpt2-250m": {
|
| 1708 |
+
"0": [
|
| 1709 |
+
10.9341459274292
|
| 1710 |
+
],
|
| 1711 |
+
"1": [
|
| 1712 |
+
10.934042739868165
|
| 1713 |
+
],
|
| 1714 |
+
"2": [
|
| 1715 |
+
10.944120025634765
|
| 1716 |
+
],
|
| 1717 |
+
"3": [
|
| 1718 |
+
10.955198446909586
|
| 1719 |
+
],
|
| 1720 |
+
"4": [
|
| 1721 |
+
10.947817611694337
|
| 1722 |
+
],
|
| 1723 |
+
"5": [
|
| 1724 |
+
10.95099925994873
|
| 1725 |
+
],
|
| 1726 |
+
"6": [
|
| 1727 |
+
10.918320020039877
|
| 1728 |
+
],
|
| 1729 |
+
"7": [
|
| 1730 |
+
10.917640924453735
|
| 1731 |
+
],
|
| 1732 |
+
"8": [
|
| 1733 |
+
10.934884071350098
|
| 1734 |
+
],
|
| 1735 |
+
"9": [
|
| 1736 |
+
10.920173645019531
|
| 1737 |
+
],
|
| 1738 |
+
"10": [
|
| 1739 |
+
10.913983345031738
|
| 1740 |
+
],
|
| 1741 |
+
"11": [
|
| 1742 |
+
10.854215621948242
|
| 1743 |
+
],
|
| 1744 |
+
"12": [
|
| 1745 |
+
10.904011011123657
|
| 1746 |
+
],
|
| 1747 |
+
"13": [
|
| 1748 |
+
10.89674186706543
|
| 1749 |
+
],
|
| 1750 |
+
"14": [
|
| 1751 |
+
10.912863731384277
|
| 1752 |
+
],
|
| 1753 |
+
"15": [
|
| 1754 |
+
10.8756103515625
|
| 1755 |
+
],
|
| 1756 |
+
"16": [
|
| 1757 |
+
10.82695255279541
|
| 1758 |
+
],
|
| 1759 |
+
"17": [
|
| 1760 |
+
10.846389055252075
|
| 1761 |
+
],
|
| 1762 |
+
"18": [
|
| 1763 |
+
10.82868251800537
|
| 1764 |
+
],
|
| 1765 |
+
"19": [
|
| 1766 |
+
10.803816986083984
|
| 1767 |
+
]
|
| 1768 |
}
|
| 1769 |
}
|