Spaces:
Running
Running
lixuejing
commited on
Commit
·
72d4c29
1
Parent(s):
b8b086c
fix
Browse files- src/display/utils.py +46 -46
src/display/utils.py
CHANGED
@@ -138,49 +138,49 @@ NUMERIC_INTERVALS = {
|
|
138 |
}
|
139 |
|
140 |
# Define the baselines
|
141 |
-
baseline_row = {
|
142 |
-
AutoEvalColumn.model.name: "<p>Baseline</p>",
|
143 |
-
AutoEvalColumn.revision.name: "N/A",
|
144 |
-
AutoEvalColumn.precision.name: None,
|
145 |
-
AutoEvalColumn.average.name: 92.75,
|
146 |
-
#AutoEvalColumn.merged.name: False,
|
147 |
-
AutoEvalColumn.CMMMU.name: 100,
|
148 |
-
AutoEvalColumn.MMMU.name: 100,
|
149 |
-
AutoEvalColumn.MMMU_Pro_standard.name: 100,
|
150 |
-
AutoEvalColumn.MMMU_Pro_vision.name: 100,
|
151 |
-
AutoEvalColumn.MathVision.name: 100,
|
152 |
-
AutoEvalColumn.CII_Bench.name: 100,
|
153 |
-
AutoEvalColumn.Blink.name: 100,
|
154 |
-
AutoEvalColumn.CharXiv.name: 100,
|
155 |
-
AutoEvalColumn.MathVerse.name: 100,
|
156 |
-
AutoEvalColumn.MmvetV2.name: 100,
|
157 |
-
AutoEvalColumn.Ocrlite.name: 100,
|
158 |
-
AutoEvalColumn.OcrliteZh.name: 100,
|
159 |
-
AutoEvalColumn.dummy.name: "baseline",
|
160 |
-
AutoEvalColumn.model_type.name: "",
|
161 |
-
AutoEvalColumn.flagged.name: False,
|
162 |
-
}
|
163 |
-
|
164 |
-
|
165 |
-
human_baseline_row = {
|
166 |
-
AutoEvalColumn.model.name: "<p>Human performance</p>",
|
167 |
-
AutoEvalColumn.revision.name: "N/A",
|
168 |
-
AutoEvalColumn.precision.name: None,
|
169 |
-
AutoEvalColumn.average.name: 92.75,
|
170 |
-
#AutoEvalColumn.merged.name: False,
|
171 |
-
AutoEvalColumn.CMMMU.name: 100,
|
172 |
-
AutoEvalColumn.MMMU.name: 100,
|
173 |
-
AutoEvalColumn.MMMU_Pro_standard.name: 100,
|
174 |
-
AutoEvalColumn.MMMU_Pro_vision.name: 100,
|
175 |
-
AutoEvalColumn.MathVision.name: 100,
|
176 |
-
AutoEvalColumn.CII_Bench.name: 100,
|
177 |
-
AutoEvalColumn.Blink.name: 100,
|
178 |
-
AutoEvalColumn.CharXiv.name: 100,
|
179 |
-
AutoEvalColumn.MathVerse.name: 100,
|
180 |
-
AutoEvalColumn.MmvetV2.name: 100,
|
181 |
-
AutoEvalColumn.Ocrlite.name: 100,
|
182 |
-
AutoEvalColumn.OcrliteZh.name: 100,
|
183 |
-
AutoEvalColumn.dummy.name: "human_baseline",
|
184 |
-
AutoEvalColumn.model_type.name: "",
|
185 |
-
AutoEvalColumn.flagged.name: False,
|
186 |
-
}
|
|
|
138 |
}
|
139 |
|
140 |
# Define the baselines
|
141 |
+
#baseline_row = {
|
142 |
+
# AutoEvalColumn.model.name: "<p>Baseline</p>",
|
143 |
+
# AutoEvalColumn.revision.name: "N/A",
|
144 |
+
# AutoEvalColumn.precision.name: None,
|
145 |
+
# AutoEvalColumn.average.name: 92.75,
|
146 |
+
# #AutoEvalColumn.merged.name: False,
|
147 |
+
# AutoEvalColumn.CMMMU.name: 100,
|
148 |
+
# AutoEvalColumn.MMMU.name: 100,
|
149 |
+
# AutoEvalColumn.MMMU_Pro_standard.name: 100,
|
150 |
+
# AutoEvalColumn.MMMU_Pro_vision.name: 100,
|
151 |
+
# AutoEvalColumn.MathVision.name: 100,
|
152 |
+
# AutoEvalColumn.CII_Bench.name: 100,
|
153 |
+
# AutoEvalColumn.Blink.name: 100,
|
154 |
+
# AutoEvalColumn.CharXiv.name: 100,
|
155 |
+
# AutoEvalColumn.MathVerse.name: 100,
|
156 |
+
# AutoEvalColumn.MmvetV2.name: 100,
|
157 |
+
# AutoEvalColumn.Ocrlite.name: 100,
|
158 |
+
# AutoEvalColumn.OcrliteZh.name: 100,
|
159 |
+
# AutoEvalColumn.dummy.name: "baseline",
|
160 |
+
# AutoEvalColumn.model_type.name: "",
|
161 |
+
# AutoEvalColumn.flagged.name: False,
|
162 |
+
#}
|
163 |
+
#
|
164 |
+
## Define the human baselines
|
165 |
+
#human_baseline_row = {
|
166 |
+
# AutoEvalColumn.model.name: "<p>Human performance</p>",
|
167 |
+
# AutoEvalColumn.revision.name: "N/A",
|
168 |
+
# AutoEvalColumn.precision.name: None,
|
169 |
+
# AutoEvalColumn.average.name: 92.75,
|
170 |
+
# #AutoEvalColumn.merged.name: False,
|
171 |
+
# AutoEvalColumn.CMMMU.name: 100,
|
172 |
+
# AutoEvalColumn.MMMU.name: 100,
|
173 |
+
# AutoEvalColumn.MMMU_Pro_standard.name: 100,
|
174 |
+
# AutoEvalColumn.MMMU_Pro_vision.name: 100,
|
175 |
+
# AutoEvalColumn.MathVision.name: 100,
|
176 |
+
# AutoEvalColumn.CII_Bench.name: 100,
|
177 |
+
# AutoEvalColumn.Blink.name: 100,
|
178 |
+
# AutoEvalColumn.CharXiv.name: 100,
|
179 |
+
# AutoEvalColumn.MathVerse.name: 100,
|
180 |
+
# AutoEvalColumn.MmvetV2.name: 100,
|
181 |
+
# AutoEvalColumn.Ocrlite.name: 100,
|
182 |
+
# AutoEvalColumn.OcrliteZh.name: 100,
|
183 |
+
# AutoEvalColumn.dummy.name: "human_baseline",
|
184 |
+
# AutoEvalColumn.model_type.name: "",
|
185 |
+
# AutoEvalColumn.flagged.name: False,
|
186 |
+
#}
|