Skip to content

Commit 6995217

Browse files
committed
graphics
1 parent fe2af80 commit 6995217

File tree

1 file changed

+32
-32
lines changed

1 file changed

+32
-32
lines changed

notebooks/evaluation_experiment.ipynb

Lines changed: 32 additions & 32 deletions
Original file line numberDiff line numberDiff line change
@@ -10,7 +10,7 @@
1010
},
1111
{
1212
"cell_type": "code",
13-
"execution_count": 33,
13+
"execution_count": 1,
1414
"metadata": {},
1515
"outputs": [],
1616
"source": [
@@ -24,7 +24,7 @@
2424
},
2525
{
2626
"cell_type": "code",
27-
"execution_count": 34,
27+
"execution_count": 2,
2828
"metadata": {},
2929
"outputs": [],
3030
"source": [
@@ -61,7 +61,7 @@
6161
},
6262
{
6363
"cell_type": "code",
64-
"execution_count": 35,
64+
"execution_count": 3,
6565
"metadata": {},
6666
"outputs": [],
6767
"source": [
@@ -183,7 +183,7 @@
183183
},
184184
{
185185
"cell_type": "code",
186-
"execution_count": 36,
186+
"execution_count": 4,
187187
"metadata": {},
188188
"outputs": [],
189189
"source": [
@@ -195,7 +195,7 @@
195195
},
196196
{
197197
"cell_type": "code",
198-
"execution_count": 37,
198+
"execution_count": 5,
199199
"metadata": {},
200200
"outputs": [],
201201
"source": [
@@ -209,7 +209,7 @@
209209
},
210210
{
211211
"cell_type": "code",
212-
"execution_count": 38,
212+
"execution_count": 6,
213213
"metadata": {},
214214
"outputs": [],
215215
"source": [
@@ -219,7 +219,7 @@
219219
},
220220
{
221221
"cell_type": "code",
222-
"execution_count": 39,
222+
"execution_count": 7,
223223
"metadata": {},
224224
"outputs": [
225225
{
@@ -244,7 +244,7 @@
244244
},
245245
{
246246
"cell_type": "code",
247-
"execution_count": 40,
247+
"execution_count": 8,
248248
"metadata": {},
249249
"outputs": [
250250
{
@@ -266,7 +266,7 @@
266266
},
267267
{
268268
"cell_type": "code",
269-
"execution_count": 41,
269+
"execution_count": 9,
270270
"metadata": {},
271271
"outputs": [
272272
{
@@ -288,7 +288,7 @@
288288
},
289289
{
290290
"cell_type": "code",
291-
"execution_count": 42,
291+
"execution_count": 10,
292292
"metadata": {},
293293
"outputs": [
294294
{
@@ -468,7 +468,7 @@
468468
"init Llama-3-70B init False 53.17 ± 17.86 "
469469
]
470470
},
471-
"execution_count": 42,
471+
"execution_count": 10,
472472
"metadata": {},
473473
"output_type": "execute_result"
474474
}
@@ -496,7 +496,7 @@
496496
},
497497
{
498498
"cell_type": "code",
499-
"execution_count": 76,
499+
"execution_count": 11,
500500
"metadata": {},
501501
"outputs": [],
502502
"source": [
@@ -509,7 +509,7 @@
509509
},
510510
{
511511
"cell_type": "code",
512-
"execution_count": 85,
512+
"execution_count": 12,
513513
"metadata": {},
514514
"outputs": [],
515515
"source": [
@@ -521,7 +521,7 @@
521521
},
522522
{
523523
"cell_type": "code",
524-
"execution_count": 86,
524+
"execution_count": 13,
525525
"metadata": {},
526526
"outputs": [
527527
{
@@ -669,7 +669,7 @@
669669
" True 64.33 ± 2.25 "
670670
]
671671
},
672-
"execution_count": 86,
672+
"execution_count": 13,
673673
"metadata": {},
674674
"output_type": "execute_result"
675675
}
@@ -682,7 +682,7 @@
682682
},
683683
{
684684
"cell_type": "code",
685-
"execution_count": 87,
685+
"execution_count": 14,
686686
"metadata": {},
687687
"outputs": [
688688
{
@@ -704,7 +704,7 @@
704704
},
705705
{
706706
"cell_type": "code",
707-
"execution_count": 88,
707+
"execution_count": 15,
708708
"metadata": {},
709709
"outputs": [
710710
{
@@ -733,7 +733,7 @@
733733
},
734734
{
735735
"cell_type": "code",
736-
"execution_count": 48,
736+
"execution_count": 16,
737737
"metadata": {},
738738
"outputs": [],
739739
"source": [
@@ -747,7 +747,7 @@
747747
},
748748
{
749749
"cell_type": "code",
750-
"execution_count": 49,
750+
"execution_count": 17,
751751
"metadata": {},
752752
"outputs": [],
753753
"source": [
@@ -762,7 +762,7 @@
762762
},
763763
{
764764
"cell_type": "code",
765-
"execution_count": 50,
765+
"execution_count": 18,
766766
"metadata": {},
767767
"outputs": [
768768
{
@@ -783,7 +783,7 @@
783783
},
784784
{
785785
"cell_type": "code",
786-
"execution_count": 51,
786+
"execution_count": 19,
787787
"metadata": {},
788788
"outputs": [
789789
{
@@ -883,7 +883,7 @@
883883
" gpt-4o DE False 51.33 ± 1.53 69.50 ± 2.60 "
884884
]
885885
},
886-
"execution_count": 51,
886+
"execution_count": 19,
887887
"metadata": {},
888888
"output_type": "execute_result"
889889
}
@@ -902,7 +902,7 @@
902902
},
903903
{
904904
"cell_type": "code",
905-
"execution_count": 62,
905+
"execution_count": 20,
906906
"metadata": {},
907907
"outputs": [
908908
{
@@ -929,7 +929,7 @@
929929
},
930930
{
931931
"cell_type": "code",
932-
"execution_count": 63,
932+
"execution_count": 21,
933933
"metadata": {},
934934
"outputs": [
935935
{
@@ -1043,7 +1043,7 @@
10431043
" GA False 68.83 ± 8.75 67.83 ± 5.77 "
10441044
]
10451045
},
1046-
"execution_count": 63,
1046+
"execution_count": 21,
10471047
"metadata": {},
10481048
"output_type": "execute_result"
10491049
}
@@ -1055,7 +1055,7 @@
10551055
},
10561056
{
10571057
"cell_type": "code",
1058-
"execution_count": 64,
1058+
"execution_count": 22,
10591059
"metadata": {},
10601060
"outputs": [
10611061
{
@@ -1082,7 +1082,7 @@
10821082
},
10831083
{
10841084
"cell_type": "code",
1085-
"execution_count": 65,
1085+
"execution_count": 23,
10861086
"metadata": {},
10871087
"outputs": [
10881088
{
@@ -1196,7 +1196,7 @@
11961196
" GA False 63.67 ± 10.05 "
11971197
]
11981198
},
1199-
"execution_count": 65,
1199+
"execution_count": 23,
12001200
"metadata": {},
12011201
"output_type": "execute_result"
12021202
}
@@ -1215,7 +1215,7 @@
12151215
},
12161216
{
12171217
"cell_type": "code",
1218-
"execution_count": 52,
1218+
"execution_count": 24,
12191219
"metadata": {},
12201220
"outputs": [],
12211221
"source": [
@@ -1231,7 +1231,7 @@
12311231
},
12321232
{
12331233
"cell_type": "code",
1234-
"execution_count": 53,
1234+
"execution_count": 25,
12351235
"metadata": {},
12361236
"outputs": [
12371237
{
@@ -1252,7 +1252,7 @@
12521252
},
12531253
{
12541254
"cell_type": "code",
1255-
"execution_count": 54,
1255+
"execution_count": 26,
12561256
"metadata": {},
12571257
"outputs": [
12581258
{
@@ -1346,7 +1346,7 @@
13461346
"init gpt-4o init False 57.17 ± 12.10 "
13471347
]
13481348
},
1349-
"execution_count": 54,
1349+
"execution_count": 26,
13501350
"metadata": {},
13511351
"output_type": "execute_result"
13521352
}

0 commit comments

Comments
 (0)