pratyushmaini committed on
Commit
e6406fb
•
1 Parent(s): 1aacc3d
Files changed (3) hide show
  1. app.py +14 -2
  2. versions/llama.csv +23 -9
  3. versions/stable-lm.csv +0 -9
app.py CHANGED
@@ -5,7 +5,19 @@ import matplotlib.pyplot as plt
5
  # Function to load data from a given CSV file
6
  def load_data(version):
7
  file_path = f'versions/{version}.csv' # Replace with your file paths
8
- return pd.read_csv(file_path)
 
 
 
 
 
 
 
 
 
 
 
 
9
 
10
  # Function for searching in the leaderboard
11
  def search_leaderboard(df, query):
@@ -36,7 +48,7 @@ with demo:
36
  with gr.TabItem("Leaderboard"):
37
  with gr.Row():
38
  version_dropdown = gr.Dropdown(
39
- choices=["llama", "phi", "stable-lm"],
40
  label="🔄 Select Base Model",
41
  value="llama",
42
  )
 
5
  # Function to load data from a given CSV file
6
  def load_data(version):
7
  file_path = f'versions/{version}.csv' # Replace with your file paths
8
+ df = pd.read_csv(file_path)
9
+ # we only want specific columns and in a specific order
10
+ # column_names : Method,Model,WD,Forget Rate,Epoch,LR,Compute,ROUGE Real Authors,ROUGE SEM Real Authors,Truth Ratio Real Authors,Truth Ratio SEM Real Authors,Prob. Real Authors,Prob. SEM Real Authors,ROUGE-P Real Authors,ROUGE-P SEM Real Authors,TTR Real Authors,TTR SEM Real Authors,ROUGE Real World,ROUGE SEM Real World,Truth Ratio Real World,Truth Ratio SEM Real World,Prob. Real World,Prob. SEM Real World,ROUGE-P Real World,ROUGE-P SEM Real World,TTR Real World,TTR SEM Real World,ROUGE Retain,ROUGE SEM Retain,Truth Ratio Retain,Truth Ratio SEM Retain,Prob. Retain,Prob. SEM Retain,ROUGE-P Retain,ROUGE-P SEM Retain,TTR Retain,TTR SEM Retain,KS Test Retain,Wilcoxon PVal Retain,Wilcoxon Stat Retain,ROUGE Forget,ROUGE SEM Forget,Truth Ratio Forget,Truth Ratio SEM Forget,Prob. Forget,Prob. SEM Forget,ROUGE-P Forget,ROUGE-P SEM Forget,TTR Forget,TTR SEM Forget,KS Test Forget,Wilcoxon PVal Forget,Wilcoxon Stat Forget,KS Test Real Authors,KS Test PVal Real Authors,Wilcoxon PVal Real Authors,Wilcoxon Stat Real Authors,KS Test Real World,KS Test PVal Real World,Wilcoxon PVal Real World,Wilcoxon Stat Real World,KS Test PVal Retain,KS Test PVal Forget,Model Utility,Forget Quality
11
+ column_names = ["Method",
12
+ "Model Utility", "Forget Quality",
13
+ "ROUGE Real Authors", "Truth Ratio Real Authors", "Prob. Real Authors",
14
+ "ROUGE Real World", "Truth Ratio Real World", "Prob. Real World",
15
+ "ROUGE Retain", "Truth Ratio Retain", "Prob. Retain",
16
+ "ROUGE Forget", "Truth Ratio Forget", "Prob. Forget",
17
+ ]
18
+ df = df[column_names]
19
+
20
+ return df
21
 
22
  # Function for searching in the leaderboard
23
  def search_leaderboard(df, query):
 
48
  with gr.TabItem("Leaderboard"):
49
  with gr.Row():
50
  version_dropdown = gr.Dropdown(
51
+ choices=["llama", "phi"],
52
  label="🔄 Select Base Model",
53
  value="llama",
54
  )
versions/llama.csv CHANGED
@@ -1,9 +1,23 @@
1
- Method,Compute,PPL,Truth,ROUGE,MAPO
2
- DPO,1,0.0768753815825175,0.3986066518668836,0.9565206583678539,0.8712100761297452
3
- DPO,1,0.5996286412275281,0.3602207419553394,0.6659869365178336,0.10860875787554469
4
- Grad Ascent,1,0.01276005409910086,0.8739653533368998,0.023760115576687335,0.557119299008513
5
- Grad Ascent,1,0.9153365174437643,0.5117768071328227,0.13019174875223205,0.2736769500895253
6
- IDK,1,0.9575847571359651,0.14495165859171177,0.5215967278097287,0.9513180970650936
7
- IDK,1,0.5081723023409522,0.7260250131902866,0.46407442478973215,0.9008803129332287
8
- KL,1,0.23284021819861755,0.7973023013038227,0.9713336423092905,0.674807833567933
9
- KL,1,0.04023188230471908,0.7071738714102987,0.4663170982373773,0.6658539062921722
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ,index,Method,Model,WD,Forget Rate,Epoch,LR,Compute,ROUGE Real Authors,ROUGE SEM Real Authors,Truth Ratio Real Authors,Truth Ratio SEM Real Authors,Prob. Real Authors,Prob. SEM Real Authors,ROUGE-P Real Authors,ROUGE-P SEM Real Authors,TTR Real Authors,TTR SEM Real Authors,ROUGE Real World,ROUGE SEM Real World,Truth Ratio Real World,Truth Ratio SEM Real World,Prob. Real World,Prob. SEM Real World,ROUGE-P Real World,ROUGE-P SEM Real World,TTR Real World,TTR SEM Real World,ROUGE Retain,ROUGE SEM Retain,Truth Ratio Retain,Truth Ratio SEM Retain,Prob. Retain,Prob. SEM Retain,ROUGE-P Retain,ROUGE-P SEM Retain,TTR Retain,TTR SEM Retain,KS Test Retain,Wilcoxon PVal Retain,Wilcoxon Stat Retain,ROUGE Forget,ROUGE SEM Forget,Truth Ratio Forget,Truth Ratio SEM Forget,Prob. Forget,Prob. SEM Forget,ROUGE-P Forget,ROUGE-P SEM Forget,TTR Forget,TTR SEM Forget,KS Test Forget,Wilcoxon PVal Forget,Wilcoxon Stat Forget,KS Test Real Authors,KS Test PVal Real Authors,Wilcoxon PVal Real Authors,Wilcoxon Stat Real Authors,KS Test Real World,KS Test PVal Real World,Wilcoxon PVal Real World,Wilcoxon Stat Real World,KS Test PVal Retain,KS Test PVal Forget,Model Utility,Forget Quality
2
+ 254,0,Finetune Model,Llama-2-7B,0.0,0,-1,1e-05,0.0,0.9329999999999999,0.02378587136868601,0.5906712782297949,0.03387326041191319,0.4529615680881898,0.022529558405746858,0.17365584961134498,0.007052746400281119,0.9711479727132513,0.004934130913988655,0.8831908831908832,0.02891603593003461,0.5596387660002274,0.03594771311341075,0.4279401568170806,0.027010465124066053,0.10041107389135993,0.006099955540692599,0.9116643120381124,0.007061923106032409,0.9885927710282548,0.004116614633043364,0.48376209606309467,0.014166403314249702,0.9888492808338375,0.001496862772045587,0.9839221638885342,0.005172697629831861,0.9228793357882765,0.0033391564038546253,,,,0.9844665453461495,0.0051727714413351816,0.5021345577886491,0.013075097432894608,0.9905248646281772,0.0007461848129786882,0.9876392022245997,0.004309388867036841,0.9158566386007846,0.0035939738499808516,0.38,4.709184258054772e-44,0.036345514950166115,,,,,,,,,,1.096624314778916e-19,0.6285644571327744,1.096624314778916e-19
3
+ 153,0,Grad. Ascent,Llama-2-7B,0.0,1,0,1e-05,0.98989898989899,0.9329999999999999,0.02378587136868601,0.5906712782297949,0.03387326041191319,0.4529615680881898,0.022529558405746858,0.17365584961134498,0.007052746400281119,0.9711479727132513,0.004934130913988655,0.8831908831908832,0.02891603593003461,0.5596387660002274,0.03594771311341075,0.4279401568170806,0.027010465124066053,0.10041107389135993,0.006099955540692599,0.9116643120381124,0.007061923106032409,0.9885927710282548,0.004116614633043364,0.48376209606309467,0.014166403314249702,0.9888492808338375,0.001496862772045587,0.9839221638885342,0.005172697629831861,0.9228793357882765,0.0033391564038546253,,,,0.9706077188940092,0.017620908359488253,0.5303743109742608,0.03407162338129851,0.9937714403974752,0.0010783212615616724,0.9681058114035087,0.018374271519515418,0.9166079435138229,0.008456020405592082,0.4,4.765788617078215e-07,0.08414634146341464,,,,,,,,,,0.003018184077228396,0.6285644571327744,0.003018184077228396
4
+ 154,0,Grad. Ascent,Llama-2-7B,0.0,1,1,1e-05,0.98989898989899,0.9329999999999999,0.02378587136868601,0.5900429345628848,0.033905759300725195,0.4547378833757618,0.022335305669671995,0.1755233138034995,0.007054415039534881,0.9705581657460249,0.005055939888176935,0.8874643874643875,0.02809493708284436,0.5601436387215902,0.03594055775086999,0.4311578250642015,0.026881223608336224,0.101544103709312,0.006030005405901275,0.9125813125165163,0.0071185045685729365,0.9889397136536354,0.0037059751472614064,0.48344775524839767,0.01405782374996479,0.9872371886220882,0.0014907038206082325,0.987697022848052,0.004142802637345347,0.9232821917154683,0.0034525307216189344,,,,0.7761951905387826,0.03772874843774116,0.5348676866651111,0.034412833437561345,0.8994496957903285,0.01639860932264404,0.7697821692084698,0.03782303934764471,0.9036587801876312,0.009903910085434673,0.425,3.489894879749045e-07,0.08048780487804878,,,,,,,,,,0.0012708143485281624,0.6298261119892148,0.0012708143485281624
5
+ 155,0,Grad. Ascent,Llama-2-7B,0.0,1,2,1e-05,0.98989898989899,0.9329999999999999,0.02378587136868601,0.5873988265455783,0.03397508491678948,0.4508092646908872,0.022551229274736694,0.1739081567383425,0.007062546425329464,0.9665255339610767,0.005908090892117214,0.8760683760683761,0.029119795619916317,0.5583610983349427,0.03599265069970819,0.4281143594726287,0.026936659748423613,0.09949787624348999,0.005927416138043877,0.9107472606370924,0.0070831369098684925,0.9829393276544355,0.004747087133082975,0.4874752426550318,0.014033035101973904,0.9855465733622553,0.0018392288196213203,0.9823404390280708,0.0048268090647223105,0.9234222857023673,0.00337002024051439,,,,0.6634498511248423,0.03979501310983266,0.5330159294477221,0.03463020113629034,0.7603332595788647,0.033966656011972296,0.6583112962777088,0.039468344041597575,0.9078713971845589,0.009329761694848934,0.425,2.0396328181959689e-07,0.07439024390243902,,,,,,,,,,0.0012708143485281624,0.6274349162486959,0.0012708143485281624
6
+ 156,0,Grad. Ascent,Llama-2-7B,0.0,1,3,1e-05,0.98989898989899,0.9329999999999999,0.02378587136868601,0.5767494734917964,0.034372249724000214,0.4408938678030151,0.02287028723794112,0.1750376753678611,0.007158422081483091,0.9663828541959902,0.00575613164904337,0.8917378917378919,0.02791127949453827,0.5513137330681693,0.03617204964693906,0.42021024790475425,0.027096090976780653,0.09769306113650794,0.0059427576527659514,0.9055722933002827,0.007772959154843439,0.9616573619305047,0.006924760552611335,0.4892999713770692,0.014168689417265349,0.9774506636931869,0.0028459379602567628,0.9583282920447302,0.007198221797581762,0.9220386919418376,0.003423647927837329,,,,0.5121226937822042,0.032962969948126364,0.54345131884367,0.034968297994459455,0.43023176455719464,0.04345304441763552,0.470313608214277,0.03389656752927492,0.8711500171294493,0.010297842300251473,0.375,5.841629899805412e-07,0.08658536585365853,,,,,,,,,,0.006760732303569208,0.6208832381499613,0.006760732303569208
7
+ 157,0,Grad. Ascent,Llama-2-7B,0.0,1,4,1e-05,0.98989898989899,0.943,0.02184680361707013,0.569912690980619,0.03466840517291862,0.43204434512382306,0.023307965482841985,0.17792390999093788,0.007721143710477113,0.9666332582272671,0.0057618895495265676,0.8831908831908832,0.028916035930034605,0.5473668144428057,0.03622314683593883,0.414897165484955,0.027344081869356943,0.09466068410867952,0.006050371078030876,0.8990135186717393,0.007874996621043741,0.9360858953948274,0.009325230518351905,0.49302946184701624,0.014332776372096316,0.9674047600471735,0.003620235746904036,0.9232295288474817,0.01000286376090822,0.9195202169991762,0.0035090468594729846,,,,0.4726138841044719,0.03209104244253,0.5596537628394563,0.038582904584907325,0.273127242585076,0.040910247561870554,0.4193707732983415,0.03496432463333179,0.8648833328747095,0.010606785895688082,0.35,2.8431650207494386e-05,0.14146341463414633,,,,,,,,,,0.01430154804770646,0.6152017367360003,0.01430154804770646
8
+ 133,0,Grad. Diff.,Llama-2-7B,0.0,1,0,1e-05,0.9837146980004123,0.9329999999999999,0.02378587136868601,0.5906712782297949,0.03387326041191319,0.4529615680881898,0.022529558405746858,0.17365584961134498,0.007052746400281119,0.9711479727132513,0.004934130913988655,0.8831908831908832,0.02891603593003461,0.5596387660002274,0.03594771311341075,0.4279401568170806,0.027010465124066053,0.10041107389135993,0.006099955540692599,0.9116643120381124,0.007061923106032409,0.9885927710282548,0.004116614633043364,0.48376209606309467,0.014166403314249702,0.9888492808338375,0.001496862772045587,0.9839221638885342,0.005172697629831861,0.9228793357882765,0.0033391564038546253,,,,0.9706077188940092,0.017620908359488253,0.5303743109742608,0.03407162338129851,0.9937714403974752,0.0010783212615616724,0.9681058114035087,0.018374271519515418,0.9166079435138229,0.008456020405592082,0.4,4.765788617078215e-07,0.08414634146341464,,,,,,,,,,0.003018184077228396,0.6285644571327744,0.003018184077228396
9
+ 134,0,Grad. Diff.,Llama-2-7B,0.0,1,1,1e-05,0.9837146980004123,0.9329999999999999,0.02378587136868601,0.5831342368229205,0.034195526749926465,0.4463399542137994,0.022676754446149583,0.1741332194637148,0.007005056236897536,0.9711427967298144,0.004892496292632562,0.8746438746438747,0.02986595450792445,0.5553851084435623,0.03611651818945058,0.42606843965321073,0.02705610226448954,0.09996325669567287,0.006159195821413578,0.9108871819027446,0.007062997168334457,0.9881749522878556,0.00403912406410768,0.48451691239938044,0.014172133539883811,0.9886402516003234,0.0015158301664681946,0.984391926889841,0.00497080235933812,0.9225775765926555,0.0033693716971956124,,,,0.8470500248532187,0.03425612789078735,0.5321108595821069,0.0345352995124133,0.9437253641548825,0.010302771440246095,0.8551610918357241,0.0338847158578802,0.9129679236930579,0.008755089796400987,0.425,3.489894879749045e-07,0.08048780487804878,,,,,,,,,,0.0012708143485281624,0.6247652337390697,0.0012708143485281624
10
+ 135,0,Grad. Diff.,Llama-2-7B,0.0,1,2,1e-05,0.9837146980004123,0.9329999999999999,0.02378587136868601,0.5743689863204028,0.03459778800824567,0.4395178398225532,0.02291569750507518,0.17573586844871675,0.0071367315805213145,0.971376699089106,0.004833659056828999,0.8846153846153846,0.02814097500969468,0.5500806928206896,0.03629220886455765,0.4206527134660717,0.027177369607437277,0.10089550395690719,0.005891426629145233,0.9103603531622805,0.007225732932586464,0.9876166503747148,0.003958159615863906,0.48619738136346835,0.014218352461945517,0.9870674423893376,0.0017276553352510255,0.9834584001935912,0.005012665963437899,0.9230005342696567,0.003320496577337283,,,,0.693891532134268,0.040761864873975456,0.5313708135093245,0.03468764401794746,0.7907704753851272,0.03193867027599963,0.697210810027939,0.0408282479347697,0.9117740693087659,0.008923458576449092,0.425,3.1401395972352475e-07,0.07926829268292683,,,,,,,,,,0.0012708143485281624,0.620856677526391,0.0012708143485281624
11
+ 136,0,Grad. Diff.,Llama-2-7B,0.0,1,3,1e-05,0.9837146980004123,0.9229999999999999,0.02553883950441608,0.5588856115278307,0.03486192436995179,0.42454388004631033,0.023382520023456987,0.17113257408226445,0.006696328375983813,0.971384233041181,0.004872506472042895,0.8660968660968662,0.030161453599377153,0.5440843064984168,0.03625778397852338,0.4103980888734902,0.02752113340668667,0.09743177268489672,0.006137860799523201,0.9075885179544705,0.007384150110357787,0.9567632211441702,0.008380284589874188,0.4919675035655331,0.014354171258223164,0.9788901898126867,0.002587745577928834,0.9498857465693834,0.009150898069415532,0.9209175410960485,0.0035039275462926496,,,,0.5611743395394859,0.0361031249078284,0.5357745264531568,0.035138959954993894,0.48186478504437824,0.04263428759390712,0.5391800516220583,0.0371989002115956,0.8954952252076869,0.010479046564108179,0.4,1.055741449818015e-06,0.09390243902439024,,,,,,,,,,0.003018184077228396,0.6098886454382855,0.003018184077228396
12
+ 137,0,Grad. Diff.,Llama-2-7B,0.0,1,4,1e-05,0.9837146980004123,0.9229999999999999,0.02553883950441608,0.5495203912493695,0.03510662588135505,0.41377046154740876,0.023744863866831466,0.16752673547642588,0.006608755494593228,0.9705274573313899,0.005449214872377944,0.8703703703703705,0.03001669034410197,0.5372712890340352,0.036215753077327884,0.40173797204393547,0.02764724919841151,0.09540026299698359,0.006152647895052731,0.9050756487748767,0.007502582140361348,0.916460247115961,0.010795592976781397,0.49330805534207384,0.014632422453902047,0.965061026568477,0.0034352591571064324,0.9011082675444243,0.011800933253074398,0.9188436974164093,0.0036434938209770657,,,,0.49253655875189073,0.03322129247825073,0.542568072727047,0.03635081642015713,0.2987510252217606,0.040704356395482096,0.442433429498021,0.03283629382771646,0.8643185765471209,0.012045353707243911,0.35,1.6715837773517706e-05,0.1329268292682927,,,,,,,,,,0.01430154804770646,0.601047475651797,0.01430154804770646
13
+ 163,0,KL Min.,Llama-2-7B,0.0,1,0,1e-05,0.9746444032158318,0.9329999999999999,0.02378587136868601,0.5906712782297949,0.03387326041191319,0.4529615680881898,0.022529558405746858,0.17365584961134498,0.007052746400281119,0.9711479727132513,0.004934130913988655,0.8831908831908832,0.02891603593003461,0.5596387660002274,0.03594771311341075,0.4279401568170806,0.027010465124066053,0.10041107389135993,0.006099955540692599,0.9116643120381124,0.007061923106032409,0.9885927710282548,0.004116614633043364,0.48376209606309467,0.014166403314249702,0.9888492808338375,0.001496862772045587,0.9839221638885342,0.005172697629831861,0.9228793357882765,0.0033391564038546253,,,,0.9706077188940092,0.017620908359488253,0.5303743109742608,0.03407162338129851,0.9937714403974752,0.0010783212615616724,0.9681058114035087,0.018374271519515418,0.9166079435138229,0.008456020405592082,0.4,4.765788617078215e-07,0.08414634146341464,,,,,,,,,,0.003018184077228396,0.6285644571327744,0.003018184077228396
14
+ 164,0,KL Min.,Llama-2-7B,0.0,1,1,1e-05,0.9746444032158318,0.9329999999999999,0.02378587136868601,0.5926914370142016,0.03380708048334772,0.4552599427511621,0.022397353324240442,0.17548038451057024,0.007054889176896772,0.9701414990793583,0.005048595089360008,0.8917378917378919,0.02791127949453827,0.5606620010502634,0.03589288783261826,0.4313463368160679,0.026893905130676334,0.10109508486948855,0.006048669438358328,0.9115536136563003,0.007054328446766984,0.9866427948861284,0.004164280248771519,0.48380044848689596,0.014028587577548995,0.987079635387015,0.001524838575423045,0.9856550808912471,0.004541405936506324,0.9234270631972602,0.003406348491488958,,,,0.7786513675263843,0.038214845616106496,0.5342827939227608,0.03416607249348546,0.9022485278034719,0.01636718106068851,0.7863602232753086,0.03872457119116467,0.9052995628926588,0.009539580654677837,0.425,4.299272404750809e-07,0.08292682926829269,,,,,,,,,,0.0012708143485281624,0.6305829841958074,0.0012708143485281624
15
+ 165,0,KL Min.,Llama-2-7B,0.0,1,2,1e-05,0.9746444032158318,0.9329999999999999,0.02378587136868601,0.5852513278783095,0.03415700434871471,0.4512026997232316,0.022526850296365288,0.1744369057670915,0.007011106460219607,0.9684490075591609,0.005697520028061312,0.878917378917379,0.02908252649809801,0.5583273505371179,0.03607477677978727,0.42904895977528,0.027004029214984314,0.10027173126835717,0.006095704998244655,0.9102069325105575,0.0071130182494677984,0.9837020298645062,0.004679527798699983,0.4863827807838256,0.014036072547985811,0.9851094086008342,0.0019048629397133007,0.97964844544246,0.005470548235405333,0.9232841112517135,0.003354321867024587,,,,0.6452102127494272,0.038795734192378806,0.5339878688212196,0.03469282005007738,0.7561577607136813,0.033841205404102265,0.640837113817565,0.039597880960097746,0.9005021575058872,0.009514024034688795,0.4,1.634398358874023e-07,0.07195121951219512,,,,,,,,,,0.003018184077228396,0.6274392149443913,0.003018184077228396
16
+ 166,0,KL Min.,Llama-2-7B,0.0,1,3,1e-05,0.9746444032158318,0.9329999999999999,0.02378587136868601,0.5771976816818047,0.034452997218025624,0.4406256089564199,0.022935863913454847,0.17579360511063297,0.007156745309643807,0.9661798328164983,0.005836219904184736,0.878917378917379,0.02908252649809801,0.5505496096178601,0.036126357568608575,0.42045603527182135,0.02714191375993806,0.09428626024741103,0.006039913345791347,0.9011634386488793,0.007877591930412776,0.9631817083850834,0.006755508048376161,0.4901608167131136,0.014162208578683038,0.9758064280747213,0.0031446263998563873,0.9574773675645152,0.007325667723048805,0.9220544162502203,0.0034188156565595406,,,,0.5208700880045747,0.033876535953684686,0.5440980827111798,0.035182167822362186,0.42186229134424025,0.04294040838303995,0.4713160054717275,0.03472033829656913,0.8696356371868526,0.011975877633282655,0.4,1.6943467926466838e-06,0.1,,,,,,,,,,0.003018184077228396,0.6202838445189751,0.003018184077228396
17
+ 167,0,KL Min.,Llama-2-7B,0.0,1,4,1e-05,0.9746444032158318,0.943,0.02184680361707013,0.5692502257120079,0.034771819647641575,0.43256772458393544,0.0233634075991481,0.17679272538606905,0.007668194919986859,0.9662452463366895,0.006148103128195363,0.878917378917379,0.02908252649809801,0.5470188356526116,0.0362099382523936,0.4138519074688882,0.027345791961117884,0.09082474692862029,0.005808831078849859,0.8958202632877043,0.008035621885511554,0.9400564537393836,0.009134905713481647,0.49234372072457055,0.014370784864646631,0.9647276478070979,0.0039017286602883216,0.9235177368548603,0.01012576780838096,0.9189732932079522,0.003530267429751703,,,,0.47597794758075834,0.03239373479241791,0.558581347045137,0.038240055904861195,0.2621098289071951,0.03934582654858117,0.40951543215189046,0.030112049427227196,0.8638400038292596,0.010322399053324752,0.375,2.8431650207494386e-05,0.14146341463414633,,,,,,,,,,0.006760732303569208,0.6146480741594899,0.006760732303569208
18
+ 143,0,Pref. Opt.,Llama-2-7B,0.0,1,0,1e-05,0.9837146980004123,0.9329999999999999,0.02378587136868601,0.5906712782297949,0.03387326041191319,0.4529615680881898,0.022529558405746858,0.17365584961134498,0.007052746400281119,0.9711479727132513,0.004934130913988655,0.8831908831908832,0.02891603593003461,0.5596387660002274,0.03594771311341075,0.4279401568170806,0.027010465124066053,0.10041107389135993,0.006099955540692599,0.9116643120381124,0.007061923106032409,0.9885927710282548,0.004116614633043364,0.48376209606309467,0.014166403314249702,0.9888492808338375,0.001496862772045587,0.9839221638885342,0.005172697629831861,0.9228793357882765,0.0033391564038546253,,,,0.9706077188940092,0.017620908359488253,0.5303743109742608,0.03407162338129851,0.9937714403974752,0.0010783212615616724,0.9681058114035087,0.018374271519515418,0.9166079435138229,0.008456020405592082,0.4,4.765788617078215e-07,0.08414634146341464,,,,,,,,,,0.003018184077228396,0.6285644571327744,0.003018184077228396
19
+ 144,0,Pref. Opt.,Llama-2-7B,0.0,1,1,1e-05,0.9837146980004123,0.9329999999999999,0.02378587136868601,0.5924105428404896,0.033263694434418234,0.4565522451578235,0.021610794050383905,0.1766362229531734,0.007145618092346133,0.9709098974802777,0.0050599919253484765,0.8874643874643875,0.02809493708284436,0.5594055257705869,0.03567260486346218,0.43350943486503823,0.02661437028896882,0.1056862156657845,0.006183210785840322,0.9198611150631801,0.006919614182981682,0.9810836592209436,0.005358997022471166,0.47823084373482894,0.013991136456899415,0.987682564962214,0.0014294465117274482,0.9837301765046863,0.005270907546412638,0.9240710251171401,0.003335151516141506,,,,0.9685243855606759,0.017780552723972488,0.5416122420147298,0.0335048502246019,0.9917345789108578,0.0011589828601444156,0.9660224780701754,0.018520210577111264,0.9166642498201292,0.008456217893549868,0.425,1.6943467926466838e-06,0.1,,,,,,,,,,0.0012708143485281624,0.6296293128306515,0.0012708143485281624
20
+ 145,0,Pref. Opt.,Llama-2-7B,0.0,1,2,1e-05,0.9837146980004123,0.9363333333333332,0.0226726819112893,0.606546647433683,0.030961077053547004,0.46835196679220437,0.019662428798979843,0.18027710108089362,0.007120540722361764,0.9711053228188717,0.005193141445257983,0.8717948717948718,0.029276166353085355,0.5598299511583128,0.03513500053040345,0.4438246441699819,0.025308810405222027,0.10646149121607264,0.006189134075678301,0.9216962290636657,0.006709124114274743,0.9719699980936025,0.0063748268799224865,0.468221641983294,0.013605114756446606,0.9822887429450634,0.0014869938769852837,0.9847992127106778,0.0049558019543791566,0.9257162977066123,0.003308987703675799,,,,0.8186714818241565,0.043115858610446985,0.566483639868165,0.03249111598229366,0.9565788230001161,0.005529587923744388,0.8353519284034615,0.042068217012389,0.9176329318591485,0.008773384722766613,0.425,4.5276301534613594e-06,0.11341463414634147,,,,,,,,,,0.0012708143485281624,0.632871908926051,0.0012708143485281624
21
+ 146,0,Pref. Opt.,Llama-2-7B,0.0,1,3,1e-05,0.9837146980004123,0.9363333333333332,0.0226726819112893,0.6209160392815353,0.02921498876116747,0.47751150900909095,0.018195830443283427,0.18402368903026795,0.007452606075757043,0.971230589018051,0.005180439432376149,0.8660968660968662,0.03016145359937715,0.5636513328534187,0.03397030619562475,0.4500346651850733,0.024116036374058982,0.10894654161447405,0.006392292787809994,0.9267264216214894,0.006596954642520662,0.9394917009335717,0.010209371403798576,0.460885816164811,0.013399740935308158,0.9751565902878809,0.0017260002980401803,0.9733056382182119,0.006991045991164258,0.9287424401721425,0.0033082966207093195,,,,0.5236425314354136,0.06006007523324811,0.5820412789879955,0.03188653465299932,0.9042981066202153,0.008310046664909112,0.5434620650095046,0.061323014422537105,0.9316512654147395,0.010667582742999213,0.375,5.845156920258887e-06,0.11707317073170732,,,,,,,,,,0.006760732303569208,0.6345567312241833,0.006760732303569208
22
+ 147,0,Pref. Opt.,Llama-2-7B,0.0,1,4,1e-05,0.9837146980004123,0.9363333333333332,0.0226726819112893,0.6226602095796977,0.028556734993852778,0.479269047982605,0.017397555112613837,0.19010803523961417,0.007968879579021804,0.971887674038294,0.005207517121420166,0.8917378917378919,0.02724332888874447,0.5622231069115052,0.0336037536961641,0.45085733177400755,0.02340373364616858,0.11387149699825733,0.0061898143954831585,0.9334525928992325,0.006707866917734486,0.905155660984239,0.012720361050411409,0.4567800978942038,0.013256573510614282,0.9686896057092785,0.0019275416460468816,0.961450621340768,0.008536871990541558,0.9323639006302699,0.0032033723924312922,,,,0.15229945036720657,0.049092941234932366,0.5901997851872188,0.031438784846847985,0.8591139219396796,0.00928767343239399,0.18063505337112148,0.0493767152706705,0.9691722958986757,0.010434715487281379,0.375,1.6715837773517706e-05,0.1329268292682927,,,,,,,,,,0.006760732303569208,0.6335834527767225,0.006760732303569208
23
+ 169,0,Retain Model,Llama-2-7B,0.0,1,-1,1e-05,0.0,0.945,0.02105188395801711,0.5926241084713598,0.03345059593050104,0.4544514898987734,0.021893655065203167,0.17353989749500584,0.006538369470852875,0.967232018904305,0.005690027028802709,0.878917378917379,0.02908252649809801,0.5442517457082237,0.03644994289779965,0.4220565650208274,0.027247431184912106,0.10057341165244862,0.006012069013665042,0.9135588025349304,0.006767434505349635,0.9809455309460164,0.0058307259379082295,0.47882616449120396,0.01410518223667099,0.990023753985948,0.0007292641153727538,0.9846272824265296,0.005002917384509446,0.9241821753906638,0.0033307787579352774,,,,0.4057248745903669,0.029331873414771226,0.6701244699861956,0.02808055457287809,0.1736882915925146,0.025915814128189336,0.4039820476083342,0.03168689004734824,0.8936834437422675,0.012238378133721525,0.0,1.0,0.0,,,,,,,,,,1.0,0.6246309817225171,1.0
versions/stable-lm.csv DELETED
@@ -1,9 +0,0 @@
1
- Method,Compute,PPL,Truth,ROUGE,MAPO
2
- DPO,1,0.0768753815825175,0.3986066518668836,0.9565206583678539,0.8712100761297452
3
- DPO,1,0.5996286412275281,0.3602207419553394,0.6659869365178336,0.10860875787554469
4
- Grad Ascent,1,0.01276005409910086,0.8739653533368998,0.023760115576687335,0.557119299008513
5
- Grad Ascent,1,0.9153365174437643,0.5117768071328227,0.13019174875223205,0.2736769500895253
6
- IDK,1,0.9575847571359651,0.14495165859171177,0.5215967278097287,0.9513180970650936
7
- IDK,1,0.5081723023409522,0.7260250131902866,0.46407442478973215,0.9008803129332287
8
- KL,1,0.23284021819861755,0.7973023013038227,0.9713336423092905,0.674807833567933
9
- KL,1,0.04023188230471908,0.7071738714102987,0.4663170982373773,0.6658539062921722