taesiri commited on
Commit
c8b7025
·
1 Parent(s): 0ec0046
Files changed (38) hide show
  1. .gitattributes +36 -0
  2. app.py +22 -3
  3. results_qwen/CodeLlama-70b-Instruct-hf.csv +3 -0
  4. results_qwen/CodeLlama-70b-Instruct-hf.jpg +3 -0
  5. results_qwen/CodeLlama-70b-Instruct-hf.pkl +3 -0
  6. results_qwen/CodeLlama-70b-Instruct-hf.png +3 -0
  7. results_qwen/Mixtral-8x7B-Instruct-v0.1.csv +3 -0
  8. results_qwen/Mixtral-8x7B-Instruct-v0.1.jpg +3 -0
  9. results_qwen/Mixtral-8x7B-Instruct-v0.1.pkl +3 -0
  10. results_qwen/Mixtral-8x7B-Instruct-v0.1.png +3 -0
  11. results_qwen/claude-3-haiku-20240307.csv +3 -0
  12. results_qwen/claude-3-haiku-20240307.jpg +3 -0
  13. results_qwen/claude-3-haiku-20240307.pkl +3 -0
  14. results_qwen/claude-3-haiku-20240307.png +3 -0
  15. results_qwen/claude-3-opus-20240229.csv +3 -0
  16. results_qwen/claude-3-opus-20240229.jpg +3 -0
  17. results_qwen/claude-3-opus-20240229.pkl +3 -0
  18. results_qwen/claude-3-opus-20240229.png +3 -0
  19. results_qwen/deepseek-llm-67b-chat.csv +3 -0
  20. results_qwen/deepseek-llm-67b-chat.jpg +3 -0
  21. results_qwen/deepseek-llm-67b-chat.pkl +3 -0
  22. results_qwen/deepseek-llm-67b-chat.png +3 -0
  23. results_qwen/gemma-7b-it.csv +3 -0
  24. results_qwen/gemma-7b-it.jpg +3 -0
  25. results_qwen/gemma-7b-it.pkl +3 -0
  26. results_qwen/gemma-7b-it.png +3 -0
  27. results_qwen/gpt-3.5-turbo-0125.csv +3 -0
  28. results_qwen/gpt-3.5-turbo-0125.jpg +3 -0
  29. results_qwen/gpt-3.5-turbo-0125.pkl +3 -0
  30. results_qwen/gpt-3.5-turbo-0125.png +3 -0
  31. results_qwen/gpt-4-0125-preview.csv +3 -0
  32. results_qwen/gpt-4-0125-preview.jpg +3 -0
  33. results_qwen/gpt-4-0125-preview.pkl +3 -0
  34. results_qwen/gpt-4-0125-preview.png +3 -0
  35. results_qwen/gpt-4-turbo-2024-04-09.csv +3 -0
  36. results_qwen/gpt-4-turbo-2024-04-09.jpg +3 -0
  37. results_qwen/gpt-4-turbo-2024-04-09.pkl +3 -0
  38. results_qwen/gpt-4-turbo-2024-04-09.png +3 -0
.gitattributes CHANGED
@@ -195,3 +195,39 @@ results/claude-3-sonnet-20240229.jpg filter=lfs diff=lfs merge=lfs -text
195
  results/claude-3-sonnet-20240229.pkl filter=lfs diff=lfs merge=lfs -text
196
  results/deepseek-llm-67b-chat.jpg filter=lfs diff=lfs merge=lfs -text
197
  results-vision/claude-3-opus-20240229.csv filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
195
  results/claude-3-sonnet-20240229.pkl filter=lfs diff=lfs merge=lfs -text
196
  results/deepseek-llm-67b-chat.jpg filter=lfs diff=lfs merge=lfs -text
197
  results-vision/claude-3-opus-20240229.csv filter=lfs diff=lfs merge=lfs -text
198
+ results_qwen/CodeLlama-70b-Instruct-hf.csv filter=lfs diff=lfs merge=lfs -text
199
+ results_qwen/claude-3-opus-20240229.png filter=lfs diff=lfs merge=lfs -text
200
+ results_qwen/gpt-4-0125-preview.png filter=lfs diff=lfs merge=lfs -text
201
+ results_qwen/gpt-4-turbo-2024-04-09.jpg filter=lfs diff=lfs merge=lfs -text
202
+ results_qwen/claude-3-haiku-20240307.csv filter=lfs diff=lfs merge=lfs -text
203
+ results_qwen/gemma-7b-it.pkl filter=lfs diff=lfs merge=lfs -text
204
+ results_qwen/gpt-4-0125-preview.csv filter=lfs diff=lfs merge=lfs -text
205
+ results_qwen/gpt-4-0125-preview.pkl filter=lfs diff=lfs merge=lfs -text
206
+ results_qwen/CodeLlama-70b-Instruct-hf.jpg filter=lfs diff=lfs merge=lfs -text
207
+ results_qwen/Mixtral-8x7B-Instruct-v0.1.jpg filter=lfs diff=lfs merge=lfs -text
208
+ results_qwen/deepseek-llm-67b-chat.pkl filter=lfs diff=lfs merge=lfs -text
209
+ results_qwen/gemma-7b-it.jpg filter=lfs diff=lfs merge=lfs -text
210
+ results_qwen/gemma-7b-it.png filter=lfs diff=lfs merge=lfs -text
211
+ results_qwen/gpt-3.5-turbo-0125.pkl filter=lfs diff=lfs merge=lfs -text
212
+ results_qwen/Mixtral-8x7B-Instruct-v0.1.pkl filter=lfs diff=lfs merge=lfs -text
213
+ results_qwen/gpt-4-0125-preview.jpg filter=lfs diff=lfs merge=lfs -text
214
+ results_qwen/gpt-4-turbo-2024-04-09.csv filter=lfs diff=lfs merge=lfs -text
215
+ results_qwen/gpt-4-turbo-2024-04-09.png filter=lfs diff=lfs merge=lfs -text
216
+ results_qwen/Mixtral-8x7B-Instruct-v0.1.csv filter=lfs diff=lfs merge=lfs -text
217
+ results_qwen/Mixtral-8x7B-Instruct-v0.1.png filter=lfs diff=lfs merge=lfs -text
218
+ results_qwen/claude-3-haiku-20240307.pkl filter=lfs diff=lfs merge=lfs -text
219
+ results_qwen/claude-3-haiku-20240307.png filter=lfs diff=lfs merge=lfs -text
220
+ results_qwen/claude-3-opus-20240229.jpg filter=lfs diff=lfs merge=lfs -text
221
+ results_qwen/deepseek-llm-67b-chat.csv filter=lfs diff=lfs merge=lfs -text
222
+ results_qwen/CodeLlama-70b-Instruct-hf.pkl filter=lfs diff=lfs merge=lfs -text
223
+ results_qwen/deepseek-llm-67b-chat.jpg filter=lfs diff=lfs merge=lfs -text
224
+ results_qwen/gpt-3.5-turbo-0125.csv filter=lfs diff=lfs merge=lfs -text
225
+ results_qwen/claude-3-opus-20240229.csv filter=lfs diff=lfs merge=lfs -text
226
+ results_qwen/claude-3-opus-20240229.pkl filter=lfs diff=lfs merge=lfs -text
227
+ results_qwen/gemma-7b-it.csv filter=lfs diff=lfs merge=lfs -text
228
+ results_qwen/gpt-3.5-turbo-0125.jpg filter=lfs diff=lfs merge=lfs -text
229
+ results_qwen/gpt-3.5-turbo-0125.png filter=lfs diff=lfs merge=lfs -text
230
+ results_qwen/gpt-4-turbo-2024-04-09.pkl filter=lfs diff=lfs merge=lfs -text
231
+ results_qwen/CodeLlama-70b-Instruct-hf.png filter=lfs diff=lfs merge=lfs -text
232
+ results_qwen/claude-3-haiku-20240307.jpg filter=lfs diff=lfs merge=lfs -text
233
+ results_qwen/deepseek-llm-67b-chat.png filter=lfs diff=lfs merge=lfs -text
app.py CHANGED
@@ -15,7 +15,8 @@ import pandas as pd
15
 
16
 
17
  # Load text benchmark results
18
- csv_results = glob("results/*.pkl")
 
19
  # Load vision benchmark results
20
  vision_results = glob("results-vision/*.pkl")
21
  # Load CoT text benchmark results
@@ -36,7 +37,7 @@ def load_data(files, model_type):
36
 
37
 
38
  # Load and label all data
39
- data = load_data(csv_results, "Text Only")
40
  vision_data = load_data(vision_results, "Vision")
41
  cot_text_data = load_data(cot_text_results, "CoT Text Only")
42
  # cot_vision_data = load_data(cot_vision_results, "CoT Vision")
@@ -61,7 +62,7 @@ text_only_filtered_raw_cot = None
61
 
62
 
63
  # Load the csv files into a dict with keys being name of the file and values being the data
64
- data = {file: pd.read_pickle(file) for file in csv_results}
65
  # Load the vision files into a dict
66
  vision_data = {file: pd.read_pickle(file) for file in vision_results}
67
  # Load the CoT text files into a dict
@@ -69,6 +70,8 @@ cot_text_data = {file: pd.read_pickle(file) for file in cot_text_results}
69
  # Load the CoT vision files into a dict
70
  # cot_vision_data = {file: pd.read_pickle(file) for file in cot_vision_results}
71
 
 
 
72
 
73
  intersection_df = pd.read_pickle(
74
  "./intersection_results/gpt-3.5-judge-by_Qwen_5times_intersection_subset_1.pkl"
@@ -124,12 +127,15 @@ def process_data(data):
124
 
125
  # Process all data
126
  text_data_for_df = process_data(data)
 
 
127
  vision_data_for_df = process_data(vision_data)
128
  cot_text_data_for_df = process_data(cot_text_data)
129
  # cot_vision_data_for_df = process_data(cot_vision_data)
130
 
131
  # Create DataFrames
132
  accuracy_df = pd.DataFrame(text_data_for_df, columns=column_names)
 
133
  vision_accuracy_df = pd.DataFrame(vision_data_for_df, columns=column_names)
134
  cot_text_accuracy_df = pd.DataFrame(cot_text_data_for_df, columns=column_names)
135
  # cot_vision_accuracy_df = pd.DataFrame(cot_vision_data_for_df, columns=column_names)
@@ -146,6 +152,7 @@ def finalize_df(df):
146
 
147
  # Finalize all DataFrames
148
  accuracy_df = finalize_df(accuracy_df)
 
149
  vision_accuracy_df = finalize_df(vision_accuracy_df)
150
  cot_text_accuracy_df = finalize_df(cot_text_accuracy_df)
151
  # cot_vision_accuracy_df = finalize_df(cot_vision_accuracy_df)
@@ -156,6 +163,11 @@ def load_heatmap(evt: gr.SelectData):
156
  return heatmap_image
157
 
158
 
 
 
 
 
 
159
  def load_vision_heatmap(evt: gr.SelectData):
160
  heatmap_image = gr.Image(f"results-vision/{evt.value}.jpg")
161
  return heatmap_image
@@ -430,6 +442,13 @@ with gr.Blocks() as demo:
430
  heatmap_image = gr.Image(label="", show_label=False)
431
  leader_board.select(fn=load_heatmap, outputs=[heatmap_image])
432
 
 
 
 
 
 
 
 
433
  with gr.Tab("Vision Benchmark"):
434
  gr.Markdown("# Vision Benchmark Leaderboard")
435
  leader_board_vision = gr.Dataframe(
 
15
 
16
 
17
  # Load text benchmark results
18
+ noncot_results = glob("results/*.pkl")
19
+ noncot_results_qwen = glob("results_qwen/*.pkl")
20
  # Load vision benchmark results
21
  vision_results = glob("results-vision/*.pkl")
22
  # Load CoT text benchmark results
 
37
 
38
 
39
  # Load and label all data
40
+ data = load_data(noncot_results, "Text Only")
41
  vision_data = load_data(vision_results, "Vision")
42
  cot_text_data = load_data(cot_text_results, "CoT Text Only")
43
  # cot_vision_data = load_data(cot_vision_results, "CoT Vision")
 
62
 
63
 
64
  # Load the csv files into a dict with keys being name of the file and values being the data
65
+ data = {file: pd.read_pickle(file) for file in noncot_results}
66
  # Load the vision files into a dict
67
  vision_data = {file: pd.read_pickle(file) for file in vision_results}
68
  # Load the CoT text files into a dict
 
70
  # Load the CoT vision files into a dict
71
  # cot_vision_data = {file: pd.read_pickle(file) for file in cot_vision_results}
72
 
73
+ data_qwen = {file: pd.read_pickle(file) for file in noncot_results_qwen}
74
+
75
 
76
  intersection_df = pd.read_pickle(
77
  "./intersection_results/gpt-3.5-judge-by_Qwen_5times_intersection_subset_1.pkl"
 
127
 
128
  # Process all data
129
  text_data_for_df = process_data(data)
130
+ text_data_for_df_qwen = process_data(data_qwen)
131
+
132
  vision_data_for_df = process_data(vision_data)
133
  cot_text_data_for_df = process_data(cot_text_data)
134
  # cot_vision_data_for_df = process_data(cot_vision_data)
135
 
136
  # Create DataFrames
137
  accuracy_df = pd.DataFrame(text_data_for_df, columns=column_names)
138
+ accuracy_df_qwen = pd.DataFrame(text_data_for_df_qwen, columns=column_names)
139
  vision_accuracy_df = pd.DataFrame(vision_data_for_df, columns=column_names)
140
  cot_text_accuracy_df = pd.DataFrame(cot_text_data_for_df, columns=column_names)
141
  # cot_vision_accuracy_df = pd.DataFrame(cot_vision_data_for_df, columns=column_names)
 
152
 
153
  # Finalize all DataFrames
154
  accuracy_df = finalize_df(accuracy_df)
155
+ accuracy_df_qwen = finalize_df(accuracy_df_qwen)
156
  vision_accuracy_df = finalize_df(vision_accuracy_df)
157
  cot_text_accuracy_df = finalize_df(cot_text_accuracy_df)
158
  # cot_vision_accuracy_df = finalize_df(cot_vision_accuracy_df)
 
163
  return heatmap_image
164
 
165
 
166
+ def load_heatmap_qwen(evt: gr.SelectData):
167
+ heatmap_image = gr.Image(f"results_qwen/{evt.value}.jpg")
168
+ return heatmap_image
169
+
170
+
171
  def load_vision_heatmap(evt: gr.SelectData):
172
  heatmap_image = gr.Image(f"results-vision/{evt.value}.jpg")
173
  return heatmap_image
 
442
  heatmap_image = gr.Image(label="", show_label=False)
443
  leader_board.select(fn=load_heatmap, outputs=[heatmap_image])
444
 
445
+ with gr.Tab("Text-only Benchmark (Judged by Qwen)"):
446
+ gr.Markdown("# Text-only Leaderboard (Judged by Qwen)")
447
+ leader_board = gr.Dataframe(accuracy_df_qwen, headers=headers_with_icons)
448
+ gr.Markdown("## Heatmap")
449
+ heatmap_image_qwen = gr.Image(label="", show_label=False)
450
+ leader_board.select(fn=load_heatmap_qwen, outputs=[heatmap_image_qwen])
451
+
452
  with gr.Tab("Vision Benchmark"):
453
  gr.Markdown("# Vision Benchmark Leaderboard")
454
  leader_board_vision = gr.Dataframe(
results_qwen/CodeLlama-70b-Instruct-hf.csv ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8eb9e387ef5e3ec72c0cf7f9fb69721135481977c3b2277cee5511312b8975cd
3
+ size 14962036
results_qwen/CodeLlama-70b-Instruct-hf.jpg ADDED

Git LFS Details

  • SHA256: ec863021f1f34f0dcb94379e600a79f87aff5364f35db4bf18319cfed9ace7cf
  • Pointer size: 132 Bytes
  • Size of remote file: 1.31 MB
results_qwen/CodeLlama-70b-Instruct-hf.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:203ab4a96fdca08c9155d6cec16d72eac15e35506e4ef551fa0fe8cf867c96a5
3
+ size 14974843
results_qwen/CodeLlama-70b-Instruct-hf.png ADDED

Git LFS Details

  • SHA256: 5fce36a6f9e4eb220a3fcf00c3b81089f53447c16729cba8cdd08eff6aa2796b
  • Pointer size: 132 Bytes
  • Size of remote file: 1.01 MB
results_qwen/Mixtral-8x7B-Instruct-v0.1.csv ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b4ad69d274c473073093be7fb46a2d1070a3db35cfdfbb196a927efc2df204f
3
+ size 15659205
results_qwen/Mixtral-8x7B-Instruct-v0.1.jpg ADDED

Git LFS Details

  • SHA256: 99f126d1e67029d44ab0978fa8f60bac2a1066c7728074168edf763659b8cbfa
  • Pointer size: 132 Bytes
  • Size of remote file: 1.32 MB
results_qwen/Mixtral-8x7B-Instruct-v0.1.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:579a96d609f2bd4650a078944535c7bf2d348f9304bf627248c1a40910815452
3
+ size 15660660
results_qwen/Mixtral-8x7B-Instruct-v0.1.png ADDED

Git LFS Details

  • SHA256: 5c3e1b87d8fecd69735bb14a9f50b29e9dad36c134df633e246e65b6946de14a
  • Pointer size: 132 Bytes
  • Size of remote file: 1.01 MB
results_qwen/claude-3-haiku-20240307.csv ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb5ca14f6f17cd4c3422e071a6e03dfc5504cb3709f5422a4b44c01daa00f57f
3
+ size 17778799
results_qwen/claude-3-haiku-20240307.jpg ADDED

Git LFS Details

  • SHA256: e4ca3f9ae806b5160a7ee69d55d4b1e607a0f2fa8018abfd178a345d4539703d
  • Pointer size: 132 Bytes
  • Size of remote file: 1.3 MB
results_qwen/claude-3-haiku-20240307.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4a38e2e7e8f22ec5c7c55561a25cd51cfe1e261f4c171e9995993b9d41bb028
3
+ size 17780948
results_qwen/claude-3-haiku-20240307.png ADDED

Git LFS Details

  • SHA256: 279f1efc22c5bf50306b8f675394e72fe763c3e345e8d8ad2b2a5e0faf6a79ac
  • Pointer size: 132 Bytes
  • Size of remote file: 1.01 MB
results_qwen/claude-3-opus-20240229.csv ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:413814671b1a00fe6b8fa308ab8fc4e76a046799d2e275c5fe51a1606d0a5062
3
+ size 18235109
results_qwen/claude-3-opus-20240229.jpg ADDED

Git LFS Details

  • SHA256: 5a02ca8e953854fbb5538d070597e878a6af5bd202c93ad1c35ce2c6ded363bc
  • Pointer size: 132 Bytes
  • Size of remote file: 1.21 MB
results_qwen/claude-3-opus-20240229.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be62c58b6b5e21ae49bdf5ba96ad4628d959b9843a2eba691bddd9c5bd717f1d
3
+ size 18253951
results_qwen/claude-3-opus-20240229.png ADDED

Git LFS Details

  • SHA256: c199b8c8e681c485b8972025ed3488464dd166642dcac9ee150989a9c650961c
  • Pointer size: 132 Bytes
  • Size of remote file: 1.01 MB
results_qwen/deepseek-llm-67b-chat.csv ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:668c30672d315df2c899df7627039723fc35bba099ae410792729a087a65b9fb
3
+ size 12916783
results_qwen/deepseek-llm-67b-chat.jpg ADDED

Git LFS Details

  • SHA256: c31e2ff0f6672617639ed92f33d41b96ea82d3c81590ad8f869555f7d8cbd5b6
  • Pointer size: 132 Bytes
  • Size of remote file: 1.33 MB
results_qwen/deepseek-llm-67b-chat.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e26477861326f0784a70903beadad6a4ca7dc61e18e3a76db9cc713d196dab0
3
+ size 12957786
results_qwen/deepseek-llm-67b-chat.png ADDED

Git LFS Details

  • SHA256: e7028fadc4c5172a89ff58a8074e0aa3d14eb7c343cb9dcb90a9266a6e090008
  • Pointer size: 132 Bytes
  • Size of remote file: 1.01 MB
results_qwen/gemma-7b-it.csv ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:abcf0738cde1e241535a90aae98338d1b9505a844c9561877e245b604676e489
3
+ size 11246490
results_qwen/gemma-7b-it.jpg ADDED

Git LFS Details

  • SHA256: bc4ca1f65ed04e50e3402823b7812d9f7a8080d1a2b022c2e8204ca82cbd2624
  • Pointer size: 132 Bytes
  • Size of remote file: 1.32 MB
results_qwen/gemma-7b-it.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2cd2216230dadc2adf5a73a1b64c799f27913cf4033e7333290962c8926b9557
3
+ size 11301306
results_qwen/gemma-7b-it.png ADDED

Git LFS Details

  • SHA256: ed89e875f18947cd237e312dc5293e2947a1287bd63dd15197689e0bff2614a7
  • Pointer size: 132 Bytes
  • Size of remote file: 1.01 MB
results_qwen/gpt-3.5-turbo-0125.csv ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3da618470a9256a02824d308cab84e80400ded429b9157c20b89ba720f708bb1
3
+ size 8041854
results_qwen/gpt-3.5-turbo-0125.jpg ADDED

Git LFS Details

  • SHA256: 707a882b8cdb3da1d75bfc68be6fa0de2f694a75c09e4d752d43da4a5576c6ba
  • Pointer size: 132 Bytes
  • Size of remote file: 1.33 MB
results_qwen/gpt-3.5-turbo-0125.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e224821031c0d87b38a113efff8a9100fe770d067d2d94662c81ad6207718963
3
+ size 8069783
results_qwen/gpt-3.5-turbo-0125.png ADDED

Git LFS Details

  • SHA256: 445c3dd96c469ec350c63ac2c057eea10b836eb44ae2311b487a10e82ca2ed44
  • Pointer size: 132 Bytes
  • Size of remote file: 1.01 MB
results_qwen/gpt-4-0125-preview.csv ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd1c1982308ad0b1f510001f407bf50a9378dc94391993f4116c02beaa55c27f
3
+ size 15996843
results_qwen/gpt-4-0125-preview.jpg ADDED

Git LFS Details

  • SHA256: d24927f07dc58a6f8b4d96ba33d3bd5eb608648fbf09310ee6b899b071eb6705
  • Pointer size: 132 Bytes
  • Size of remote file: 1.23 MB
results_qwen/gpt-4-0125-preview.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d31b186ce750657cbddcabbf6998069ecf2f6631954a8718c88313564063b30
3
+ size 15985596
results_qwen/gpt-4-0125-preview.png ADDED

Git LFS Details

  • SHA256: 5f0eb9f8af0da0eb7cf438ce275255121b5ff4bedd2481ff54b5c340456621e1
  • Pointer size: 132 Bytes
  • Size of remote file: 1.01 MB
results_qwen/gpt-4-turbo-2024-04-09.csv ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d50952850b16d84f951949aa629db60375aa2100cf86f1b9a143cdfd83fc1c30
3
+ size 16522373
results_qwen/gpt-4-turbo-2024-04-09.jpg ADDED

Git LFS Details

  • SHA256: a7596d4256d2516d20e9962a3600a60b9eeee806af6370a13e6cf05b544744e6
  • Pointer size: 132 Bytes
  • Size of remote file: 1.22 MB
results_qwen/gpt-4-turbo-2024-04-09.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:661211c67ac6a0e6168e79df8d616b4abbc7e5d0fda335736cbe22912fade1f4
3
+ size 16542716
results_qwen/gpt-4-turbo-2024-04-09.png ADDED

Git LFS Details

  • SHA256: 22fd48ef25affc68411b79985c889b9db8884083ca17688831feca9f78e03d0c
  • Pointer size: 132 Bytes
  • Size of remote file: 1.01 MB