-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathevaldata.csv
We can make this file beautiful and searchable if this error is corrected: It looks like row 4 should actually have 3 columns, instead of 5 in line 3.
252 lines (252 loc) · 19.7 KB
/
evaldata.csv
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
chatgpt_temp_0_0,Base,0.7317073170731707
chatgpt_temp_0_0,Base + Extra,0.6341463414634146
chatgpt_temp_0_0,PropertyEval,0.6036585365853658
chatgpt_temp_0_8,Base,0.6939024390243903,0.886286656168262,0.9397098686084713
chatgpt_temp_0_8,Base + Extra,0.6246646341463414,0.8191825337254691,0.9067359333662424
chatgpt_temp_0_8,PropertyEval,0.5844207317073171,0.7926273483697817,0.8759342227375865
codegen_16b_temp_0_0,Base,0.32926829268292684
codegen_16b_temp_0_0,Base + Extra,0.2682926829268293
codegen_16b_temp_0_0,PropertyEval,0.24390243902439024
codegen_16b_temp_0_2,Base,0.32167682926829266,0.47925658524663295,0.6332515860851005
codegen_16b_temp_0_2,Base + Extra,0.2696341463414635,0.40304404158720697,0.5558250629210418
codegen_16b_temp_0_2,PropertyEval,0.2553048780487805,0.3914593724921816,0.5452095154066203
codegen_16b_temp_0_4,Base,0.3070426829268293,0.5418539794689412,0.7484750056748218
codegen_16b_temp_0_4,Base + Extra,0.25878048780487806,0.4684927286710685,0.6785749219973927
codegen_16b_temp_0_4,PropertyEval,0.24743902439024398,0.458803619423488,0.6614521110675954
codegen_16b_temp_0_6,Base,0.27771341463414634,0.5579937913101685,0.810789608725638
codegen_16b_temp_0_6,Base + Extra,0.23298780487804874,0.4840911395133365,0.7163388424129942
codegen_16b_temp_0_6,PropertyEval,0.22390243902439025,0.4736373738775247,0.7152013771843371
codegen_16b_temp_0_8,Base,0.23246951219512196,0.5308763528755898,0.8179682291406021
codegen_16b_temp_0_8,Base + Extra,0.1925609756097561,0.45504670964723876,0.7200921336182282
codegen_16b_temp_0_8,PropertyEval,0.18695121951219512,0.4459334084068244,0.7122693882158975
codegen2_16b_temp_0_0,Base,0.1951219512195122
codegen2_16b_temp_0_0,Base + Extra,0.16463414634146342
codegen2_16b_temp_0_0,PropertyEval,0.15853658536585366
codegen2_1b_temp_0_0,Base,0.10975609756097561
codegen2_1b_temp_0_0,Base + Extra,0.09146341463414634
codegen2_1b_temp_0_0,PropertyEval,0.09146341463414634
codegen2_1b_temp_0_2,Base,0.10198170731707318,0.1333203857549203,0.15321920582780713
codegen2_1b_temp_0_2,Base + Extra,0.08664634146341466,0.12061482533334908,0.13492767717120013
codegen2_1b_temp_0_2,PropertyEval,0.08823170731707318,0.12273629745313251,0.13796658993064942
codegen2_1b_temp_0_4,Base,0.09576219512195121,0.14415618929472213,0.19707432816915982
codegen2_1b_temp_0_4,Base + Extra,0.0799390243902439,0.1318157590274999,0.17132321241536094
codegen2_1b_temp_0_4,PropertyEval,0.08192073170731706,0.13009191649100638,0.1698157923446381
codegen2_1b_temp_0_6,Base,0.08344512195121952,0.15047811106771694,0.2434637176211163
codegen2_1b_temp_0_6,Base + Extra,0.06850609756097562,0.13715582154138264,0.21496123770903564
codegen2_1b_temp_0_6,PropertyEval,0.07109756097560976,0.13510184143603474,0.21039584492452143
codegen2_1b_temp_0_8,Base,0.06792682926829269,0.14448503173328955,0.24403727402765926
codegen2_1b_temp_0_8,Base + Extra,0.05612804878048781,0.1287423933201593,0.2090725285210444
codegen2_1b_temp_0_8,PropertyEval,0.057682926829268295,0.12573340262733956,0.19922025877522767
codegen2_3b_temp_0_0,Base,0.15853658536585366
codegen2_3b_temp_0_0,Base + Extra,0.12804878048780488
codegen2_3b_temp_0_0,PropertyEval,0.13414634146341464
codegen2_3b_temp_0_2,Base,0.15213414634146344,0.2113224640834067,0.26692539806191573
codegen2_3b_temp_0_2,Base + Extra,0.1285975609756098,0.18084085902754415,0.22463280669016977
codegen2_3b_temp_0_2,PropertyEval,0.12939024390243903,0.18458722996328106,0.23377904256175913
codegen2_3b_temp_0_4,Base,0.14359756097560977,0.23925298009086152,0.3331556406427196
codegen2_3b_temp_0_4,Base + Extra,0.12292682926829268,0.212455349374522,0.2950559927365617
codegen2_3b_temp_0_4,PropertyEval,0.12289634146341465,0.21133130432802336,0.29292283832479593
codegen2_3b_temp_0_6,Base,0.12496951219512195,0.24094008027614652,0.3724104082234322
codegen2_3b_temp_0_6,Base + Extra,0.10710365853658538,0.21287092548002562,0.3178394500851279
codegen2_3b_temp_0_6,PropertyEval,0.10780487804878051,0.21219031940653874,0.3221050021778091
codegen2_3b_temp_0_8,Base,0.0971036585365854,0.22377549346749256,0.3812113977958528
codegen2_3b_temp_0_8,Base + Extra,0.08368902439024392,0.20103217673267354,0.34699951640936955
codegen2_3b_temp_0_8,PropertyEval,0.08396341463414636,0.19870797587642638,0.33957977970619985
codegen2_7b_temp_0_0,Base,0.18292682926829268
codegen2_7b_temp_0_0,Base + Extra,0.16463414634146342
codegen2_7b_temp_0_0,PropertyEval,0.16463414634146342
codegen2_7b_temp_0_2,Base,0.17935975609756097,0.24457519118329005,0.30629698590112664
codegen2_7b_temp_0_2,Base + Extra,0.15929878048780488,0.21624415615901166,0.2681652968269193
codegen2_7b_temp_0_2,PropertyEval,0.15560975609756098,0.20378217733217188,0.25005366116769534
codegen2_7b_temp_0_4,Base,0.16832317073170733,0.2981949579872966,0.4310221877827216
codegen2_7b_temp_0_4,Base + Extra,0.1472560975609756,0.26426146879272805,0.38710118378435343
codegen2_7b_temp_0_4,PropertyEval,0.1442378048780488,0.2517302549835056,0.3665126943533281
codegen2_7b_temp_0_6,Base,0.14643292682926828,0.30850838891372223,0.47462198955763557
codegen2_7b_temp_0_6,Base + Extra,0.12615853658536583,0.2668114627221984,0.4271273624469881
codegen2_7b_temp_0_6,PropertyEval,0.12557926829268293,0.2609413002790326,0.41774733198928193
codegen2_7b_temp_0_8,Base,0.12097560975609756,0.30122705808558403,0.5087094156692366
codegen2_7b_temp_0_8,Base + Extra,0.10280487804878048,0.2606281371716354,0.45992722303298816
codegen2_7b_temp_0_8,PropertyEval,0.10259146341463414,0.25258113058483533,0.42988445541302045
codegen_2b_temp_0_0,Base,0.24390243902439024
codegen_2b_temp_0_0,Base + Extra,0.21341463414634146
codegen_2b_temp_0_0,PropertyEval,0.21341463414634146
codegen_2b_temp_0_2,Base,0.18378048780487807,0.39505133946766896,0.6323527569010247
codegen_2b_temp_0_2,Base + Extra,0.1529878048780488,0.3511036565634375,0.5675433477107096
codegen_2b_temp_0_2,PropertyEval,0.15564024390243905,0.34404244187918626,0.5534303063666864
codegen_2b_temp_0_4,Base,0.17966463414634143,0.38514194480779157,0.6138412225452582
codegen_2b_temp_0_4,Base + Extra,0.1496951219512195,0.3405473900023394,0.5524090499266582
codegen_2b_temp_0_4,PropertyEval,0.15070121951219512,0.3294949194293088,0.5317806059472973
codegen_2b_temp_0_6,Base,0.18118902439024387,0.3883885310857744,0.6197518296209853
codegen_2b_temp_0_6,Base + Extra,0.15036585365853655,0.34334330524761714,0.5426430278227885
codegen_2b_temp_0_6,PropertyEval,0.15384146341463417,0.3341035349625099,0.5357434056540156
codegen_2b_temp_0_8,Base,0.1834451219512195,0.395870951051275,0.6639588664265273
codegen_2b_temp_0_8,Base + Extra,0.1509451219512195,0.3451960051289364,0.5594930815492645
codegen_2b_temp_0_8,PropertyEval,0.15359756097560975,0.33870213999510995,0.5612709681669796
codegen_6b_temp_0_0,Base,0.2926829268292683
codegen_6b_temp_0_0,Base + Extra,0.25
codegen_6b_temp_0_0,PropertyEval,0.24390243902439024
codegen_6b_temp_0_2,Base,0.2764024390243902,0.39758896561152185,0.4860250756979426
codegen_6b_temp_0_2,Base + Extra,0.23426829268292684,0.34831615475835037,0.4217652426923288
codegen_6b_temp_0_2,PropertyEval,0.22140243902439025,0.3290399869013478,0.41846806207858867
codegen_6b_temp_0_4,Base,0.2626829268292683,0.45192389132129673,0.6566919949589086
codegen_6b_temp_0_4,Base + Extra,0.22030487804878046,0.3966339054262196,0.5767249707903119
codegen_6b_temp_0_4,PropertyEval,0.21228658536585365,0.3865065780351637,0.5715664078286138
codegen_6b_temp_0_6,Base,0.23896341463414633,0.46821333877312676,0.7061758973869926
codegen_6b_temp_0_6,Base + Extra,0.20121951219512196,0.41512170609232374,0.634240619314695
codegen_6b_temp_0_6,PropertyEval,0.19597560975609757,0.40515442151547415,0.6309982963570373
codegen_6b_temp_0_8,Base,0.20030487804878044,0.4516295095407938,0.7318607050735717
codegen_6b_temp_0_8,Base + Extra,0.16664634146341462,0.39614478033587747,0.6570035168202824
codegen_6b_temp_0_8,PropertyEval,0.16353658536585367,0.3818780681647306,0.6385550800635764
gpt_4_temp_0_0,Base,0.8841463414634146
gpt_4_temp_0_0,Base + Extra,0.7865853658536586
gpt_4_temp_0_0,PropertyEval,0.7621951219512195
gpt_j_temp_0_0,Base,0.12195121951219512
gpt_j_temp_0_0,Base + Extra,0.10365853658536585
gpt_j_temp_0_0,PropertyEval,0.10365853658536585
gpt_j_temp_0_2,Base,0.11307926829268292,0.1508270378518113,0.1913684275023176
gpt_j_temp_0_2,Base + Extra,0.09484756097560976,0.11898027381716011,0.14867018016808548
gpt_j_temp_0_2,PropertyEval,0.09442073170731707,0.12202489156086159,0.14867017012271497
gpt_j_temp_0_4,Base,0.10012195121951219,0.17010807199168446,0.27230301719707434
gpt_j_temp_0_4,Base + Extra,0.08365853658536584,0.1402863099155565,0.2218646478839622
gpt_j_temp_0_4,PropertyEval,0.08469512195121952,0.1386195987593862,0.21438286278733598
gpt_j_temp_0_6,Base,0.08664634146341461,0.17702651381318923,0.31766485222027996
gpt_j_temp_0_6,Base + Extra,0.07250000000000001,0.15333631385902147,0.2676499657491822
gpt_j_temp_0_6,PropertyEval,0.07298780487804878,0.1482412281120303,0.25511460270114894
gpt_j_temp_0_8,Base,0.0714939024390244,0.17201723721281842,0.31334624404073647
gpt_j_temp_0_8,Base + Extra,0.05890243902439025,0.14821722203710186,0.25781102805526157
gpt_j_temp_0_8,PropertyEval,0.05969512195121951,0.14451424808574795,0.24359745410181388
gptneo_2b_temp_0_0,Base,0.07926829268292683
gptneo_2b_temp_0_0,Base + Extra,0.06707317073170732
gptneo_2b_temp_0_0,PropertyEval,0.06707317073170732
gptneo_2b_temp_0_2,Base,0.06451219512195122,0.10457459883900282,0.12632570718403904
gptneo_2b_temp_0_2,Base + Extra,0.05951219512195121,0.07980215137381683,0.08976563826829309
gptneo_2b_temp_0_2,PropertyEval,0.05560975609756098,0.07956181102900556,0.08976563826829309
gptneo_2b_temp_0_4,Base,0.05509146341463415,0.10984068364553934,0.1627554938579478
gptneo_2b_temp_0_4,Base + Extra,0.04963414634146342,0.08454521271318469,0.11787721281292263
gptneo_2b_temp_0_4,PropertyEval,0.04807926829268293,0.08483751013016733,0.12344468458954741
gptneo_2b_temp_0_6,Base,0.046371951219512195,0.11785057428618914,0.2099640624266031
gptneo_2b_temp_0_6,Base + Extra,0.04033536585365854,0.09261916513896634,0.17276746272891785
gptneo_2b_temp_0_6,PropertyEval,0.03939024390243903,0.09179335340179792,0.1697195980312219
gptneo_2b_temp_0_8,Base,0.03670731707317074,0.10563596259449773,0.19304227828407405
gptneo_2b_temp_0_8,Base + Extra,0.03185975609756098,0.08656989696921744,0.15987588941488498
gptneo_2b_temp_0_8,PropertyEval,0.03103658536585367,0.08491928056163861,0.15491394354337396
incoder_1b_temp_0_0,Base,0.12195121951219512
incoder_1b_temp_0_0,Base + Extra,0.10365853658536585
incoder_1b_temp_0_0,PropertyEval,0.10975609756097561
incoder_1b_temp_0_2,Base,0.0998780487804878,0.1460162386612593,0.18918597221387565
incoder_1b_temp_0_2,Base + Extra,0.08338414634146342,0.12277997338617132,0.15600417973045405
incoder_1b_temp_0_2,PropertyEval,0.08670731707317073,0.12836454011183668,0.1567707766152975
incoder_1b_temp_0_4,Base,0.0842987804878049,0.15635273470116667,0.23973570916610662
incoder_1b_temp_0_4,Base + Extra,0.07003048780487804,0.13779921810649684,0.20295464046222642
incoder_1b_temp_0_4,PropertyEval,0.07259146341463416,0.14107092090247636,0.20506423182635766
incoder_1b_temp_0_6,Base,0.07085365853658537,0.1590490563729548,0.2519564518995759
incoder_1b_temp_0_6,Base + Extra,0.05780487804878049,0.13888884833215853,0.20561538792962747
incoder_1b_temp_0_6,PropertyEval,0.060243902439024395,0.141128195219768,0.2086647282499775
incoder_1b_temp_0_8,Base,0.052469512195121956,0.14148302164046533,0.22057405467833358
incoder_1b_temp_0_8,Base + Extra,0.04402439024390243,0.12307622050094309,0.18965071012527035
incoder_1b_temp_0_8,PropertyEval,0.04579268292682927,0.12375911417325434,0.18097448292889887
incoder_6b_temp_0_0,Base,0.15853658536585366
incoder_6b_temp_0_0,Base + Extra,0.11585365853658537
incoder_6b_temp_0_0,PropertyEval,0.11585365853658537
incoder_6b_temp_0_2,Base,0.15603658536585366,0.25444807978796663,0.3258685801111753
incoder_6b_temp_0_2,Base + Extra,0.12378048780487805,0.20297484339425725,0.26715746475554636
incoder_6b_temp_0_2,PropertyEval,0.1211890243902439,0.19907915551452313,0.2676538060221093
incoder_6b_temp_0_4,Base,0.13704268292682928,0.27732655729365996,0.41654066023546255
incoder_6b_temp_0_4,Base + Extra,0.10841463414634148,0.22270646850686082,0.33597692942454765
incoder_6b_temp_0_4,PropertyEval,0.11076219512195122,0.2223719993583674,0.33369655607822696
incoder_6b_temp_0_6,Base,0.11439024390243906,0.2749988164799022,0.4504387165564537
incoder_6b_temp_0_6,Base + Extra,0.09082317073170733,0.22640799773729448,0.3963213598496223
incoder_6b_temp_0_6,PropertyEval,0.09576219512195124,0.2268778324787129,0.38569775194725353
incoder_6b_temp_0_8,Base,0.09301829268292683,0.24096861037831635,0.42096421080679225
incoder_6b_temp_0_8,Base + Extra,0.07429878048780489,0.19957132978935532,0.34865423701550596
incoder_6b_temp_0_8,PropertyEval,0.07884146341463416,0.19922155984591924,0.3440403158524318
polycoder_temp_0_0,Base,0.06097560975609756
polycoder_temp_0_0,Base + Extra,0.054878048780487805
polycoder_temp_0_0,PropertyEval,0.04878048780487805
polycoder_temp_0_2,Base,0.05911585365853659,0.08675138660930101,0.10212109736096764
polycoder_temp_0_2,Base + Extra,0.05253048780487805,0.06512759241759362,0.07280098976984123
polycoder_temp_0_2,PropertyEval,0.0486280487804878,0.069215936769349,0.07889855066971567
polycoder_temp_0_4,Base,0.055060975609756105,0.10283815624277001,0.15543590955197406
polycoder_temp_0_4,Base + Extra,0.04902439024390245,0.08091292909683472,0.1108974172428151
polycoder_temp_0_4,PropertyEval,0.046128048780487804,0.08395050269334375,0.11661386130561524
polycoder_temp_0_6,Base,0.04911585365853658,0.09896099957762369,0.1707426896698936
polycoder_temp_0_6,Base + Extra,0.04265243902439024,0.08253853574414888,0.1400501984512652
polycoder_temp_0_6,PropertyEval,0.04240853658536586,0.08296325732801979,0.14563925598991848
polycoder_temp_0_8,Base,0.03969512195121951,0.09498032103443357,0.16376014207262327
polycoder_temp_0_8,Base + Extra,0.034176829268292686,0.07887653980175204,0.12488189021993522
polycoder_temp_0_8,PropertyEval,0.03310975609756098,0.07709833974722033,0.12404062295076553
santacoder_temp_0_0,Base,0.14634146341463414
santacoder_temp_0_0,Base + Extra,0.12804878048780488
santacoder_temp_0_0,PropertyEval,0.12804878048780488
santacoder_temp_0_2,Base,0.16134146341463415,0.22466389963237055,0.28322561938993623
santacoder_temp_0_2,Base + Extra,0.13731707317073172,0.19556184834248672,0.25178708976988
santacoder_temp_0_2,PropertyEval,0.13746951219512193,0.19574920656379552,0.24815698555311713
santacoder_temp_0_4,Base,0.16603658536585367,0.27974253154473244,0.38446740682228453
santacoder_temp_0_4,Base + Extra,0.139390243902439,0.24098356832985038,0.3237312346503333
santacoder_temp_0_4,PropertyEval,0.14030487804878047,0.240798877400267,0.32914215430730537
santacoder_temp_0_6,Base,0.16073170731707317,0.2918108897178632,0.4436391142504798
santacoder_temp_0_6,Base + Extra,0.13420731707317074,0.25616414863417275,0.3890016285411586
santacoder_temp_0_6,PropertyEval,0.13402439024390245,0.25061440994214723,0.37947099240821003
santacoder_temp_0_8,Base,0.1401219512195122,0.2824622158266931,0.45403474871635385
santacoder_temp_0_8,Base + Extra,0.11579268292682927,0.2464192911926084,0.3996906768129214
santacoder_temp_0_8,PropertyEval,0.11615853658536586,0.2408419406219469,0.38421488511665847
stablelm_7b_temp_0_0,Base,0.024390243902439025
stablelm_7b_temp_0_0,Base + Extra,0.024390243902439025
stablelm_7b_temp_0_0,PropertyEval,0.018292682926829267
stablelm_7b_temp_0_2,Base,0.02713414634146342,0.053924002841013875,0.07007909757812494
stablelm_7b_temp_0_2,Base + Extra,0.0263109756097561,0.048984517799643405,0.060932756128726256
stablelm_7b_temp_0_2,PropertyEval,0.020701219512195126,0.04288695682403893,0.0548351951531165
stablelm_7b_temp_0_4,Base,0.024298780487804882,0.06788537222015664,0.12200393702618333
stablelm_7b_temp_0_4,Base + Extra,0.02292682926829269,0.06023326166396012,0.09798159335062093
stablelm_7b_temp_0_4,PropertyEval,0.019603658536585366,0.05432355970657844,0.09188403240175427
stablelm_7b_temp_0_6,Base,0.02121951219512196,0.07478031487965206,0.15819424065447693
stablelm_7b_temp_0_6,Base + Extra,0.019329268292682937,0.06587079031830519,0.12963795440187736
stablelm_7b_temp_0_6,PropertyEval,0.017743902439024396,0.060735238709216786,0.12431405943899274
stablelm_7b_temp_0_8,Base,0.015274390243902449,0.05945038669903133,0.13840394416371257
stablelm_7b_temp_0_8,Base + Extra,0.013414634146341461,0.053038041123005863,0.11320767460523766
stablelm_7b_temp_0_8,PropertyEval,0.013140243902439029,0.0486912050511292,0.11320767460541765
starcoder_temp_0_0,Base,0.34146341463414637
starcoder_temp_0_0,Base + Extra,0.2926829268292683
starcoder_temp_0_0,PropertyEval,0.27439024390243905
starcoder_temp_0_2,Base,0.32201219512195123,0.44610516389578075,0.5165312329672557
starcoder_temp_0_2,Base + Extra,0.27554878048780485,0.3914188467050528,0.467907143137772
starcoder_temp_0_2,PropertyEval,0.2600304878048781,0.3724967311166524,0.4534040676682498
starcoder_temp_0_4,Base,0.2963719512195122,0.5045721375852461,0.6528838011573476
starcoder_temp_0_4,Base + Extra,0.25359756097560976,0.4467973131103498,0.5766471102601347
starcoder_temp_0_4,PropertyEval,0.2419817073170732,0.43243190453586744,0.5783988796083672
starcoder_temp_0_6,Base,0.2760365853658537,0.5589993429144765,0.783350015469578
starcoder_temp_0_6,Base + Extra,0.23460365853658538,0.5018802562791896,0.7136094624705627
starcoder_temp_0_6,PropertyEval,0.2270426829268293,0.4888710928764058,0.7097546900891775
starcoder_temp_0_8,Base,0.24551829268292683,0.567426913139156,0.8447041523713169
starcoder_temp_0_8,Base + Extra,0.2041158536585366,0.5006358972129966,0.7562203871572232
starcoder_temp_0_8,PropertyEval,0.20073170731707318,0.4896789497823712,0.7589498480574767
vicuna_13b_temp_0_0,Base,0.16463414634146342
vicuna_13b_temp_0_0,Base + Extra,0.1524390243902439
vicuna_13b_temp_0_0,PropertyEval,0.1402439024390244
vicuna_13b_temp_0_2,Base,0.1531707317073171,0.2162586334945298,0.26380931697932547
vicuna_13b_temp_0_2,Base + Extra,0.13856707317073172,0.1937507511130478,0.2263006409432657
vicuna_13b_temp_0_2,PropertyEval,0.1273170731707317,0.18138450941078949,0.21410496118438824
vicuna_13b_temp_0_4,Base,0.14640243902439024,0.2504807867962977,0.3650877948691359
vicuna_13b_temp_0_4,Base + Extra,0.12948170731707317,0.2135518986468762,0.3079594163255997
vicuna_13b_temp_0_4,PropertyEval,0.11871951219512196,0.201201211966963,0.2926914635749006
vicuna_13b_temp_0_6,Base,0.14179878048780487,0.2810665500588924,0.48306742270045955
vicuna_13b_temp_0_6,Base + Extra,0.12317073170731709,0.2402851770641461,0.42237841781550717
vicuna_13b_temp_0_6,PropertyEval,0.11448170731707319,0.22888585880652565,0.40674979547012563
vicuna_13b_temp_0_8,Base,0.13198170731707318,0.30186939835902055,0.5504342290635061
vicuna_13b_temp_0_8,Base + Extra,0.11359756097560975,0.2570331283529767,0.46529885522380016
vicuna_13b_temp_0_8,PropertyEval,0.10692073170731707,0.2470821375196795,0.45202990354647515
vicuna_7b_temp_0_0,Base,0.11585365853658537
vicuna_7b_temp_0_0,Base + Extra,0.10975609756097561
vicuna_7b_temp_0_0,PropertyEval,0.0975609756097561
vicuna_7b_temp_0_2,Base,0.10908536585365854,0.1826325458248369,0.25081597344760115
vicuna_7b_temp_0_2,Base + Extra,0.1022560975609756,0.16243560915190977,0.2035023516738167
vicuna_7b_temp_0_2,PropertyEval,0.09496951219512195,0.15377903007541557,0.20274886215419988
vicuna_7b_temp_0_4,Base,0.10667682926829267,0.20853222484543427,0.30879983649042875
vicuna_7b_temp_0_4,Base + Extra,0.09820121951219514,0.1788946796111632,0.23775830165461123
vicuna_7b_temp_0_4,PropertyEval,0.09246951219512195,0.17435283859674144,0.2408068296288936
vicuna_7b_temp_0_6,Base,0.10417682926829269,0.23820144535452104,0.4230643400407329
vicuna_7b_temp_0_6,Base + Extra,0.09414634146341465,0.20083785999229783,0.3440524500538898
vicuna_7b_temp_0_6,PropertyEval,0.08896341463414636,0.1971722460878441,0.34690276917280993
vicuna_7b_temp_0_8,Base,0.09414634146341463,0.23475904395988687,0.3967872531210225
vicuna_7b_temp_0_8,Base + Extra,0.08359756097560975,0.19816266586433515,0.32152057254123506
vicuna_7b_temp_0_8,PropertyEval,0.07948170731707317,0.19542015427249465,0.3241871321783516