Spaces:
Running
Running
pratyushmaini
committed on
Commit
•
e6406fb
1
Parent(s):
1aacc3d
new df
Browse files
- app.py +14 -2
- versions/llama.csv +23 -9
- versions/stable-lm.csv +0 -9
app.py
CHANGED
@@ -5,7 +5,19 @@ import matplotlib.pyplot as plt
|
|
5 |
# Function to load data from a given CSV file
|
6 |
def load_data(version):
|
7 |
file_path = f'versions/{version}.csv' # Replace with your file paths
|
8 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
9 |
|
10 |
# Function for searching in the leaderboard
|
11 |
def search_leaderboard(df, query):
|
@@ -36,7 +48,7 @@ with demo:
|
|
36 |
with gr.TabItem("Leaderboard"):
|
37 |
with gr.Row():
|
38 |
version_dropdown = gr.Dropdown(
|
39 |
-
choices=["llama", "phi"
|
40 |
label="π Select Base Model",
|
41 |
value="llama",
|
42 |
)
|
|
|
5 |
# Function to load data from a given CSV file
|
6 |
def load_data(version):
|
7 |
file_path = f'versions/{version}.csv' # Replace with your file paths
|
8 |
+
df = pd.read_csv(file_path)
|
9 |
+
# we only want specific columns and in a specific order
|
10 |
+
# column_names : Method,Model,WD,Forget Rate,Epoch,LR,Compute,ROUGE Real Authors,ROUGE SEM Real Authors,Truth Ratio Real Authors,Truth Ratio SEM Real Authors,Prob. Real Authors,Prob. SEM Real Authors,ROUGE-P Real Authors,ROUGE-P SEM Real Authors,TTR Real Authors,TTR SEM Real Authors,ROUGE Real World,ROUGE SEM Real World,Truth Ratio Real World,Truth Ratio SEM Real World,Prob. Real World,Prob. SEM Real World,ROUGE-P Real World,ROUGE-P SEM Real World,TTR Real World,TTR SEM Real World,ROUGE Retain,ROUGE SEM Retain,Truth Ratio Retain,Truth Ratio SEM Retain,Prob. Retain,Prob. SEM Retain,ROUGE-P Retain,ROUGE-P SEM Retain,TTR Retain,TTR SEM Retain,KS Test Retain,Wilcoxon PVal Retain,Wilcoxon Stat Retain,ROUGE Forget,ROUGE SEM Forget,Truth Ratio Forget,Truth Ratio SEM Forget,Prob. Forget,Prob. SEM Forget,ROUGE-P Forget,ROUGE-P SEM Forget,TTR Forget,TTR SEM Forget,KS Test Forget,Wilcoxon PVal Forget,Wilcoxon Stat Forget,KS Test Real Authors,KS Test PVal Real Authors,Wilcoxon PVal Real Authors,Wilcoxon Stat Real Authors,KS Test Real World,KS Test PVal Real World,Wilcoxon PVal Real World,Wilcoxon Stat Real World,KS Test PVal Retain,KS Test PVal Forget,Model Utility,Forget Quality
|
11 |
+
column_names = ["Method",
|
12 |
+
"Model Utility", "Forget Quality",
|
13 |
+
"ROUGE Real Authors", "Truth Ratio Real Authors", "Prob. Real Authors",
|
14 |
+
"ROUGE Real World", "Truth Ratio Real World", "Prob. Real World",
|
15 |
+
"ROUGE Retain", "Truth Ratio Retain", "Prob. Retain",
|
16 |
+
"ROUGE Forget", "Truth Ratio Forget", "Prob. Forget",
|
17 |
+
]
|
18 |
+
df = df[column_names]
|
19 |
+
|
20 |
+
return df
|
21 |
|
22 |
# Function for searching in the leaderboard
|
23 |
def search_leaderboard(df, query):
|
|
|
48 |
with gr.TabItem("Leaderboard"):
|
49 |
with gr.Row():
|
50 |
version_dropdown = gr.Dropdown(
|
51 |
+
choices=["llama", "phi"],
|
52 |
label="π Select Base Model",
|
53 |
value="llama",
|
54 |
)
|
versions/llama.csv
CHANGED
@@ -1,9 +1,23 @@
|
|
1 |
-
Method,Compute,
|
2 |
-
|
3 |
-
|
4 |
-
Grad Ascent,1,0.
|
5 |
-
Grad Ascent,1,0.
|
6 |
-
|
7 |
-
|
8 |
-
|
9 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
,index,Method,Model,WD,Forget Rate,Epoch,LR,Compute,ROUGE Real Authors,ROUGE SEM Real Authors,Truth Ratio Real Authors,Truth Ratio SEM Real Authors,Prob. Real Authors,Prob. SEM Real Authors,ROUGE-P Real Authors,ROUGE-P SEM Real Authors,TTR Real Authors,TTR SEM Real Authors,ROUGE Real World,ROUGE SEM Real World,Truth Ratio Real World,Truth Ratio SEM Real World,Prob. Real World,Prob. SEM Real World,ROUGE-P Real World,ROUGE-P SEM Real World,TTR Real World,TTR SEM Real World,ROUGE Retain,ROUGE SEM Retain,Truth Ratio Retain,Truth Ratio SEM Retain,Prob. Retain,Prob. SEM Retain,ROUGE-P Retain,ROUGE-P SEM Retain,TTR Retain,TTR SEM Retain,KS Test Retain,Wilcoxon PVal Retain,Wilcoxon Stat Retain,ROUGE Forget,ROUGE SEM Forget,Truth Ratio Forget,Truth Ratio SEM Forget,Prob. Forget,Prob. SEM Forget,ROUGE-P Forget,ROUGE-P SEM Forget,TTR Forget,TTR SEM Forget,KS Test Forget,Wilcoxon PVal Forget,Wilcoxon Stat Forget,KS Test Real Authors,KS Test PVal Real Authors,Wilcoxon PVal Real Authors,Wilcoxon Stat Real Authors,KS Test Real World,KS Test PVal Real World,Wilcoxon PVal Real World,Wilcoxon Stat Real World,KS Test PVal Retain,KS Test PVal Forget,Model Utility,Forget Quality
|
2 |
+
254,0,Finetune Model,Llama-2-7B,0.0,0,-1,1e-05,0.0,0.9329999999999999,0.02378587136868601,0.5906712782297949,0.03387326041191319,0.4529615680881898,0.022529558405746858,0.17365584961134498,0.007052746400281119,0.9711479727132513,0.004934130913988655,0.8831908831908832,0.02891603593003461,0.5596387660002274,0.03594771311341075,0.4279401568170806,0.027010465124066053,0.10041107389135993,0.006099955540692599,0.9116643120381124,0.007061923106032409,0.9885927710282548,0.004116614633043364,0.48376209606309467,0.014166403314249702,0.9888492808338375,0.001496862772045587,0.9839221638885342,0.005172697629831861,0.9228793357882765,0.0033391564038546253,,,,0.9844665453461495,0.0051727714413351816,0.5021345577886491,0.013075097432894608,0.9905248646281772,0.0007461848129786882,0.9876392022245997,0.004309388867036841,0.9158566386007846,0.0035939738499808516,0.38,4.709184258054772e-44,0.036345514950166115,,,,,,,,,,1.096624314778916e-19,0.6285644571327744,1.096624314778916e-19
|
3 |
+
153,0,Grad. Ascent,Llama-2-7B,0.0,1,0,1e-05,0.98989898989899,0.9329999999999999,0.02378587136868601,0.5906712782297949,0.03387326041191319,0.4529615680881898,0.022529558405746858,0.17365584961134498,0.007052746400281119,0.9711479727132513,0.004934130913988655,0.8831908831908832,0.02891603593003461,0.5596387660002274,0.03594771311341075,0.4279401568170806,0.027010465124066053,0.10041107389135993,0.006099955540692599,0.9116643120381124,0.007061923106032409,0.9885927710282548,0.004116614633043364,0.48376209606309467,0.014166403314249702,0.9888492808338375,0.001496862772045587,0.9839221638885342,0.005172697629831861,0.9228793357882765,0.0033391564038546253,,,,0.9706077188940092,0.017620908359488253,0.5303743109742608,0.03407162338129851,0.9937714403974752,0.0010783212615616724,0.9681058114035087,0.018374271519515418,0.9166079435138229,0.008456020405592082,0.4,4.765788617078215e-07,0.08414634146341464,,,,,,,,,,0.003018184077228396,0.6285644571327744,0.003018184077228396
|
4 |
+
154,0,Grad. Ascent,Llama-2-7B,0.0,1,1,1e-05,0.98989898989899,0.9329999999999999,0.02378587136868601,0.5900429345628848,0.033905759300725195,0.4547378833757618,0.022335305669671995,0.1755233138034995,0.007054415039534881,0.9705581657460249,0.005055939888176935,0.8874643874643875,0.02809493708284436,0.5601436387215902,0.03594055775086999,0.4311578250642015,0.026881223608336224,0.101544103709312,0.006030005405901275,0.9125813125165163,0.0071185045685729365,0.9889397136536354,0.0037059751472614064,0.48344775524839767,0.01405782374996479,0.9872371886220882,0.0014907038206082325,0.987697022848052,0.004142802637345347,0.9232821917154683,0.0034525307216189344,,,,0.7761951905387826,0.03772874843774116,0.5348676866651111,0.034412833437561345,0.8994496957903285,0.01639860932264404,0.7697821692084698,0.03782303934764471,0.9036587801876312,0.009903910085434673,0.425,3.489894879749045e-07,0.08048780487804878,,,,,,,,,,0.0012708143485281624,0.6298261119892148,0.0012708143485281624
|
5 |
+
155,0,Grad. Ascent,Llama-2-7B,0.0,1,2,1e-05,0.98989898989899,0.9329999999999999,0.02378587136868601,0.5873988265455783,0.03397508491678948,0.4508092646908872,0.022551229274736694,0.1739081567383425,0.007062546425329464,0.9665255339610767,0.005908090892117214,0.8760683760683761,0.029119795619916317,0.5583610983349427,0.03599265069970819,0.4281143594726287,0.026936659748423613,0.09949787624348999,0.005927416138043877,0.9107472606370924,0.0070831369098684925,0.9829393276544355,0.004747087133082975,0.4874752426550318,0.014033035101973904,0.9855465733622553,0.0018392288196213203,0.9823404390280708,0.0048268090647223105,0.9234222857023673,0.00337002024051439,,,,0.6634498511248423,0.03979501310983266,0.5330159294477221,0.03463020113629034,0.7603332595788647,0.033966656011972296,0.6583112962777088,0.039468344041597575,0.9078713971845589,0.009329761694848934,0.425,2.0396328181959689e-07,0.07439024390243902,,,,,,,,,,0.0012708143485281624,0.6274349162486959,0.0012708143485281624
|
6 |
+
156,0,Grad. Ascent,Llama-2-7B,0.0,1,3,1e-05,0.98989898989899,0.9329999999999999,0.02378587136868601,0.5767494734917964,0.034372249724000214,0.4408938678030151,0.02287028723794112,0.1750376753678611,0.007158422081483091,0.9663828541959902,0.00575613164904337,0.8917378917378919,0.02791127949453827,0.5513137330681693,0.03617204964693906,0.42021024790475425,0.027096090976780653,0.09769306113650794,0.0059427576527659514,0.9055722933002827,0.007772959154843439,0.9616573619305047,0.006924760552611335,0.4892999713770692,0.014168689417265349,0.9774506636931869,0.0028459379602567628,0.9583282920447302,0.007198221797581762,0.9220386919418376,0.003423647927837329,,,,0.5121226937822042,0.032962969948126364,0.54345131884367,0.034968297994459455,0.43023176455719464,0.04345304441763552,0.470313608214277,0.03389656752927492,0.8711500171294493,0.010297842300251473,0.375,5.841629899805412e-07,0.08658536585365853,,,,,,,,,,0.006760732303569208,0.6208832381499613,0.006760732303569208
|
7 |
+
157,0,Grad. Ascent,Llama-2-7B,0.0,1,4,1e-05,0.98989898989899,0.943,0.02184680361707013,0.569912690980619,0.03466840517291862,0.43204434512382306,0.023307965482841985,0.17792390999093788,0.007721143710477113,0.9666332582272671,0.0057618895495265676,0.8831908831908832,0.028916035930034605,0.5473668144428057,0.03622314683593883,0.414897165484955,0.027344081869356943,0.09466068410867952,0.006050371078030876,0.8990135186717393,0.007874996621043741,0.9360858953948274,0.009325230518351905,0.49302946184701624,0.014332776372096316,0.9674047600471735,0.003620235746904036,0.9232295288474817,0.01000286376090822,0.9195202169991762,0.0035090468594729846,,,,0.4726138841044719,0.03209104244253,0.5596537628394563,0.038582904584907325,0.273127242585076,0.040910247561870554,0.4193707732983415,0.03496432463333179,0.8648833328747095,0.010606785895688082,0.35,2.8431650207494386e-05,0.14146341463414633,,,,,,,,,,0.01430154804770646,0.6152017367360003,0.01430154804770646
|
8 |
+
133,0,Grad. Diff.,Llama-2-7B,0.0,1,0,1e-05,0.9837146980004123,0.9329999999999999,0.02378587136868601,0.5906712782297949,0.03387326041191319,0.4529615680881898,0.022529558405746858,0.17365584961134498,0.007052746400281119,0.9711479727132513,0.004934130913988655,0.8831908831908832,0.02891603593003461,0.5596387660002274,0.03594771311341075,0.4279401568170806,0.027010465124066053,0.10041107389135993,0.006099955540692599,0.9116643120381124,0.007061923106032409,0.9885927710282548,0.004116614633043364,0.48376209606309467,0.014166403314249702,0.9888492808338375,0.001496862772045587,0.9839221638885342,0.005172697629831861,0.9228793357882765,0.0033391564038546253,,,,0.9706077188940092,0.017620908359488253,0.5303743109742608,0.03407162338129851,0.9937714403974752,0.0010783212615616724,0.9681058114035087,0.018374271519515418,0.9166079435138229,0.008456020405592082,0.4,4.765788617078215e-07,0.08414634146341464,,,,,,,,,,0.003018184077228396,0.6285644571327744,0.003018184077228396
|
9 |
+
134,0,Grad. Diff.,Llama-2-7B,0.0,1,1,1e-05,0.9837146980004123,0.9329999999999999,0.02378587136868601,0.5831342368229205,0.034195526749926465,0.4463399542137994,0.022676754446149583,0.1741332194637148,0.007005056236897536,0.9711427967298144,0.004892496292632562,0.8746438746438747,0.02986595450792445,0.5553851084435623,0.03611651818945058,0.42606843965321073,0.02705610226448954,0.09996325669567287,0.006159195821413578,0.9108871819027446,0.007062997168334457,0.9881749522878556,0.00403912406410768,0.48451691239938044,0.014172133539883811,0.9886402516003234,0.0015158301664681946,0.984391926889841,0.00497080235933812,0.9225775765926555,0.0033693716971956124,,,,0.8470500248532187,0.03425612789078735,0.5321108595821069,0.0345352995124133,0.9437253641548825,0.010302771440246095,0.8551610918357241,0.0338847158578802,0.9129679236930579,0.008755089796400987,0.425,3.489894879749045e-07,0.08048780487804878,,,,,,,,,,0.0012708143485281624,0.6247652337390697,0.0012708143485281624
|
10 |
+
135,0,Grad. Diff.,Llama-2-7B,0.0,1,2,1e-05,0.9837146980004123,0.9329999999999999,0.02378587136868601,0.5743689863204028,0.03459778800824567,0.4395178398225532,0.02291569750507518,0.17573586844871675,0.0071367315805213145,0.971376699089106,0.004833659056828999,0.8846153846153846,0.02814097500969468,0.5500806928206896,0.03629220886455765,0.4206527134660717,0.027177369607437277,0.10089550395690719,0.005891426629145233,0.9103603531622805,0.007225732932586464,0.9876166503747148,0.003958159615863906,0.48619738136346835,0.014218352461945517,0.9870674423893376,0.0017276553352510255,0.9834584001935912,0.005012665963437899,0.9230005342696567,0.003320496577337283,,,,0.693891532134268,0.040761864873975456,0.5313708135093245,0.03468764401794746,0.7907704753851272,0.03193867027599963,0.697210810027939,0.0408282479347697,0.9117740693087659,0.008923458576449092,0.425,3.1401395972352475e-07,0.07926829268292683,,,,,,,,,,0.0012708143485281624,0.620856677526391,0.0012708143485281624
|
11 |
+
136,0,Grad. Diff.,Llama-2-7B,0.0,1,3,1e-05,0.9837146980004123,0.9229999999999999,0.02553883950441608,0.5588856115278307,0.03486192436995179,0.42454388004631033,0.023382520023456987,0.17113257408226445,0.006696328375983813,0.971384233041181,0.004872506472042895,0.8660968660968662,0.030161453599377153,0.5440843064984168,0.03625778397852338,0.4103980888734902,0.02752113340668667,0.09743177268489672,0.006137860799523201,0.9075885179544705,0.007384150110357787,0.9567632211441702,0.008380284589874188,0.4919675035655331,0.014354171258223164,0.9788901898126867,0.002587745577928834,0.9498857465693834,0.009150898069415532,0.9209175410960485,0.0035039275462926496,,,,0.5611743395394859,0.0361031249078284,0.5357745264531568,0.035138959954993894,0.48186478504437824,0.04263428759390712,0.5391800516220583,0.0371989002115956,0.8954952252076869,0.010479046564108179,0.4,1.055741449818015e-06,0.09390243902439024,,,,,,,,,,0.003018184077228396,0.6098886454382855,0.003018184077228396
|
12 |
+
137,0,Grad. Diff.,Llama-2-7B,0.0,1,4,1e-05,0.9837146980004123,0.9229999999999999,0.02553883950441608,0.5495203912493695,0.03510662588135505,0.41377046154740876,0.023744863866831466,0.16752673547642588,0.006608755494593228,0.9705274573313899,0.005449214872377944,0.8703703703703705,0.03001669034410197,0.5372712890340352,0.036215753077327884,0.40173797204393547,0.02764724919841151,0.09540026299698359,0.006152647895052731,0.9050756487748767,0.007502582140361348,0.916460247115961,0.010795592976781397,0.49330805534207384,0.014632422453902047,0.965061026568477,0.0034352591571064324,0.9011082675444243,0.011800933253074398,0.9188436974164093,0.0036434938209770657,,,,0.49253655875189073,0.03322129247825073,0.542568072727047,0.03635081642015713,0.2987510252217606,0.040704356395482096,0.442433429498021,0.03283629382771646,0.8643185765471209,0.012045353707243911,0.35,1.6715837773517706e-05,0.1329268292682927,,,,,,,,,,0.01430154804770646,0.601047475651797,0.01430154804770646
|
13 |
+
163,0,KL Min.,Llama-2-7B,0.0,1,0,1e-05,0.9746444032158318,0.9329999999999999,0.02378587136868601,0.5906712782297949,0.03387326041191319,0.4529615680881898,0.022529558405746858,0.17365584961134498,0.007052746400281119,0.9711479727132513,0.004934130913988655,0.8831908831908832,0.02891603593003461,0.5596387660002274,0.03594771311341075,0.4279401568170806,0.027010465124066053,0.10041107389135993,0.006099955540692599,0.9116643120381124,0.007061923106032409,0.9885927710282548,0.004116614633043364,0.48376209606309467,0.014166403314249702,0.9888492808338375,0.001496862772045587,0.9839221638885342,0.005172697629831861,0.9228793357882765,0.0033391564038546253,,,,0.9706077188940092,0.017620908359488253,0.5303743109742608,0.03407162338129851,0.9937714403974752,0.0010783212615616724,0.9681058114035087,0.018374271519515418,0.9166079435138229,0.008456020405592082,0.4,4.765788617078215e-07,0.08414634146341464,,,,,,,,,,0.003018184077228396,0.6285644571327744,0.003018184077228396
|
14 |
+
164,0,KL Min.,Llama-2-7B,0.0,1,1,1e-05,0.9746444032158318,0.9329999999999999,0.02378587136868601,0.5926914370142016,0.03380708048334772,0.4552599427511621,0.022397353324240442,0.17548038451057024,0.007054889176896772,0.9701414990793583,0.005048595089360008,0.8917378917378919,0.02791127949453827,0.5606620010502634,0.03589288783261826,0.4313463368160679,0.026893905130676334,0.10109508486948855,0.006048669438358328,0.9115536136563003,0.007054328446766984,0.9866427948861284,0.004164280248771519,0.48380044848689596,0.014028587577548995,0.987079635387015,0.001524838575423045,0.9856550808912471,0.004541405936506324,0.9234270631972602,0.003406348491488958,,,,0.7786513675263843,0.038214845616106496,0.5342827939227608,0.03416607249348546,0.9022485278034719,0.01636718106068851,0.7863602232753086,0.03872457119116467,0.9052995628926588,0.009539580654677837,0.425,4.299272404750809e-07,0.08292682926829269,,,,,,,,,,0.0012708143485281624,0.6305829841958074,0.0012708143485281624
|
15 |
+
165,0,KL Min.,Llama-2-7B,0.0,1,2,1e-05,0.9746444032158318,0.9329999999999999,0.02378587136868601,0.5852513278783095,0.03415700434871471,0.4512026997232316,0.022526850296365288,0.1744369057670915,0.007011106460219607,0.9684490075591609,0.005697520028061312,0.878917378917379,0.02908252649809801,0.5583273505371179,0.03607477677978727,0.42904895977528,0.027004029214984314,0.10027173126835717,0.006095704998244655,0.9102069325105575,0.0071130182494677984,0.9837020298645062,0.004679527798699983,0.4863827807838256,0.014036072547985811,0.9851094086008342,0.0019048629397133007,0.97964844544246,0.005470548235405333,0.9232841112517135,0.003354321867024587,,,,0.6452102127494272,0.038795734192378806,0.5339878688212196,0.03469282005007738,0.7561577607136813,0.033841205404102265,0.640837113817565,0.039597880960097746,0.9005021575058872,0.009514024034688795,0.4,1.634398358874023e-07,0.07195121951219512,,,,,,,,,,0.003018184077228396,0.6274392149443913,0.003018184077228396
|
16 |
+
166,0,KL Min.,Llama-2-7B,0.0,1,3,1e-05,0.9746444032158318,0.9329999999999999,0.02378587136868601,0.5771976816818047,0.034452997218025624,0.4406256089564199,0.022935863913454847,0.17579360511063297,0.007156745309643807,0.9661798328164983,0.005836219904184736,0.878917378917379,0.02908252649809801,0.5505496096178601,0.036126357568608575,0.42045603527182135,0.02714191375993806,0.09428626024741103,0.006039913345791347,0.9011634386488793,0.007877591930412776,0.9631817083850834,0.006755508048376161,0.4901608167131136,0.014162208578683038,0.9758064280747213,0.0031446263998563873,0.9574773675645152,0.007325667723048805,0.9220544162502203,0.0034188156565595406,,,,0.5208700880045747,0.033876535953684686,0.5440980827111798,0.035182167822362186,0.42186229134424025,0.04294040838303995,0.4713160054717275,0.03472033829656913,0.8696356371868526,0.011975877633282655,0.4,1.6943467926466838e-06,0.1,,,,,,,,,,0.003018184077228396,0.6202838445189751,0.003018184077228396
|
17 |
+
167,0,KL Min.,Llama-2-7B,0.0,1,4,1e-05,0.9746444032158318,0.943,0.02184680361707013,0.5692502257120079,0.034771819647641575,0.43256772458393544,0.0233634075991481,0.17679272538606905,0.007668194919986859,0.9662452463366895,0.006148103128195363,0.878917378917379,0.02908252649809801,0.5470188356526116,0.0362099382523936,0.4138519074688882,0.027345791961117884,0.09082474692862029,0.005808831078849859,0.8958202632877043,0.008035621885511554,0.9400564537393836,0.009134905713481647,0.49234372072457055,0.014370784864646631,0.9647276478070979,0.0039017286602883216,0.9235177368548603,0.01012576780838096,0.9189732932079522,0.003530267429751703,,,,0.47597794758075834,0.03239373479241791,0.558581347045137,0.038240055904861195,0.2621098289071951,0.03934582654858117,0.40951543215189046,0.030112049427227196,0.8638400038292596,0.010322399053324752,0.375,2.8431650207494386e-05,0.14146341463414633,,,,,,,,,,0.006760732303569208,0.6146480741594899,0.006760732303569208
|
18 |
+
143,0,Pref. Opt.,Llama-2-7B,0.0,1,0,1e-05,0.9837146980004123,0.9329999999999999,0.02378587136868601,0.5906712782297949,0.03387326041191319,0.4529615680881898,0.022529558405746858,0.17365584961134498,0.007052746400281119,0.9711479727132513,0.004934130913988655,0.8831908831908832,0.02891603593003461,0.5596387660002274,0.03594771311341075,0.4279401568170806,0.027010465124066053,0.10041107389135993,0.006099955540692599,0.9116643120381124,0.007061923106032409,0.9885927710282548,0.004116614633043364,0.48376209606309467,0.014166403314249702,0.9888492808338375,0.001496862772045587,0.9839221638885342,0.005172697629831861,0.9228793357882765,0.0033391564038546253,,,,0.9706077188940092,0.017620908359488253,0.5303743109742608,0.03407162338129851,0.9937714403974752,0.0010783212615616724,0.9681058114035087,0.018374271519515418,0.9166079435138229,0.008456020405592082,0.4,4.765788617078215e-07,0.08414634146341464,,,,,,,,,,0.003018184077228396,0.6285644571327744,0.003018184077228396
|
19 |
+
144,0,Pref. Opt.,Llama-2-7B,0.0,1,1,1e-05,0.9837146980004123,0.9329999999999999,0.02378587136868601,0.5924105428404896,0.033263694434418234,0.4565522451578235,0.021610794050383905,0.1766362229531734,0.007145618092346133,0.9709098974802777,0.0050599919253484765,0.8874643874643875,0.02809493708284436,0.5594055257705869,0.03567260486346218,0.43350943486503823,0.02661437028896882,0.1056862156657845,0.006183210785840322,0.9198611150631801,0.006919614182981682,0.9810836592209436,0.005358997022471166,0.47823084373482894,0.013991136456899415,0.987682564962214,0.0014294465117274482,0.9837301765046863,0.005270907546412638,0.9240710251171401,0.003335151516141506,,,,0.9685243855606759,0.017780552723972488,0.5416122420147298,0.0335048502246019,0.9917345789108578,0.0011589828601444156,0.9660224780701754,0.018520210577111264,0.9166642498201292,0.008456217893549868,0.425,1.6943467926466838e-06,0.1,,,,,,,,,,0.0012708143485281624,0.6296293128306515,0.0012708143485281624
|
20 |
+
145,0,Pref. Opt.,Llama-2-7B,0.0,1,2,1e-05,0.9837146980004123,0.9363333333333332,0.0226726819112893,0.606546647433683,0.030961077053547004,0.46835196679220437,0.019662428798979843,0.18027710108089362,0.007120540722361764,0.9711053228188717,0.005193141445257983,0.8717948717948718,0.029276166353085355,0.5598299511583128,0.03513500053040345,0.4438246441699819,0.025308810405222027,0.10646149121607264,0.006189134075678301,0.9216962290636657,0.006709124114274743,0.9719699980936025,0.0063748268799224865,0.468221641983294,0.013605114756446606,0.9822887429450634,0.0014869938769852837,0.9847992127106778,0.0049558019543791566,0.9257162977066123,0.003308987703675799,,,,0.8186714818241565,0.043115858610446985,0.566483639868165,0.03249111598229366,0.9565788230001161,0.005529587923744388,0.8353519284034615,0.042068217012389,0.9176329318591485,0.008773384722766613,0.425,4.5276301534613594e-06,0.11341463414634147,,,,,,,,,,0.0012708143485281624,0.632871908926051,0.0012708143485281624
|
21 |
+
146,0,Pref. Opt.,Llama-2-7B,0.0,1,3,1e-05,0.9837146980004123,0.9363333333333332,0.0226726819112893,0.6209160392815353,0.02921498876116747,0.47751150900909095,0.018195830443283427,0.18402368903026795,0.007452606075757043,0.971230589018051,0.005180439432376149,0.8660968660968662,0.03016145359937715,0.5636513328534187,0.03397030619562475,0.4500346651850733,0.024116036374058982,0.10894654161447405,0.006392292787809994,0.9267264216214894,0.006596954642520662,0.9394917009335717,0.010209371403798576,0.460885816164811,0.013399740935308158,0.9751565902878809,0.0017260002980401803,0.9733056382182119,0.006991045991164258,0.9287424401721425,0.0033082966207093195,,,,0.5236425314354136,0.06006007523324811,0.5820412789879955,0.03188653465299932,0.9042981066202153,0.008310046664909112,0.5434620650095046,0.061323014422537105,0.9316512654147395,0.010667582742999213,0.375,5.845156920258887e-06,0.11707317073170732,,,,,,,,,,0.006760732303569208,0.6345567312241833,0.006760732303569208
|
22 |
+
147,0,Pref. Opt.,Llama-2-7B,0.0,1,4,1e-05,0.9837146980004123,0.9363333333333332,0.0226726819112893,0.6226602095796977,0.028556734993852778,0.479269047982605,0.017397555112613837,0.19010803523961417,0.007968879579021804,0.971887674038294,0.005207517121420166,0.8917378917378919,0.02724332888874447,0.5622231069115052,0.0336037536961641,0.45085733177400755,0.02340373364616858,0.11387149699825733,0.0061898143954831585,0.9334525928992325,0.006707866917734486,0.905155660984239,0.012720361050411409,0.4567800978942038,0.013256573510614282,0.9686896057092785,0.0019275416460468816,0.961450621340768,0.008536871990541558,0.9323639006302699,0.0032033723924312922,,,,0.15229945036720657,0.049092941234932366,0.5901997851872188,0.031438784846847985,0.8591139219396796,0.00928767343239399,0.18063505337112148,0.0493767152706705,0.9691722958986757,0.010434715487281379,0.375,1.6715837773517706e-05,0.1329268292682927,,,,,,,,,,0.006760732303569208,0.6335834527767225,0.006760732303569208
|
23 |
+
169,0,Retain Model,Llama-2-7B,0.0,1,-1,1e-05,0.0,0.945,0.02105188395801711,0.5926241084713598,0.03345059593050104,0.4544514898987734,0.021893655065203167,0.17353989749500584,0.006538369470852875,0.967232018904305,0.005690027028802709,0.878917378917379,0.02908252649809801,0.5442517457082237,0.03644994289779965,0.4220565650208274,0.027247431184912106,0.10057341165244862,0.006012069013665042,0.9135588025349304,0.006767434505349635,0.9809455309460164,0.0058307259379082295,0.47882616449120396,0.01410518223667099,0.990023753985948,0.0007292641153727538,0.9846272824265296,0.005002917384509446,0.9241821753906638,0.0033307787579352774,,,,0.4057248745903669,0.029331873414771226,0.6701244699861956,0.02808055457287809,0.1736882915925146,0.025915814128189336,0.4039820476083342,0.03168689004734824,0.8936834437422675,0.012238378133721525,0.0,1.0,0.0,,,,,,,,,,1.0,0.6246309817225171,1.0
|
versions/stable-lm.csv
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
Method,Compute,PPL,Truth,ROUGE,MAPO
|
2 |
-
DPO,1,0.0768753815825175,0.3986066518668836,0.9565206583678539,0.8712100761297452
|
3 |
-
DPO,1,0.5996286412275281,0.3602207419553394,0.6659869365178336,0.10860875787554469
|
4 |
-
Grad Ascent,1,0.01276005409910086,0.8739653533368998,0.023760115576687335,0.557119299008513
|
5 |
-
Grad Ascent,1,0.9153365174437643,0.5117768071328227,0.13019174875223205,0.2736769500895253
|
6 |
-
IDK,1,0.9575847571359651,0.14495165859171177,0.5215967278097287,0.9513180970650936
|
7 |
-
IDK,1,0.5081723023409522,0.7260250131902866,0.46407442478973215,0.9008803129332287
|
8 |
-
KL,1,0.23284021819861755,0.7973023013038227,0.9713336423092905,0.674807833567933
|
9 |
-
KL,1,0.04023188230471908,0.7071738714102987,0.4663170982373773,0.6658539062921722
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|