MINGYISU committed on
Commit
1701d2a
·
verified ·
1 Parent(s): 6a03b58

upload results logs for reference

Browse files
Archive/BGE-VL-v1.5-mmeb.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "Model": "BGE-VL-v1.5 (FT; LLaVA-1.6-Mistral)",
4
+ "URL": "https://huggingface.co/BAAI/BGE-VL-v1.5-mmeb",
5
+ "Model Size(B)": 7.57,
6
+ "Data Source": "Self-Reported",
7
+ "V1-Overall": 69.4,
8
+ "I-CLS": 63.7,
9
+ "I-QA": 64.9,
10
+ "I-RET": 72.2,
11
+ "I-VG": 86.6
12
+ }
13
+ ]
Archive/BGE-VL-v1.5-zs.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "Model": "BGE-VL-v1.5 (zeroshot; LLaVA-1.6-Mistral)",
4
+ "URL": "https://huggingface.co/BAAI/BGE-VL-v1.5-zs",
5
+ "Model Size(B)": 7.57,
6
+ "Data Source": "Self-Reported",
7
+ "V1-Overall": 60.1,
8
+ "I-CLS": 56.1,
9
+ "I-QA": 55.3,
10
+ "I-RET": 63.9,
11
+ "I-VG": 70.8
12
+ }
13
+ ]
Archive/LLaVE.json ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "Model": "LLaVE-7B",
4
+ "URL": "https://huggingface.co/zhibinlan/LLaVE-7B",
5
+ "Model Size(B)": 8.03,
6
+ "Data Source": "Self-Reported",
7
+ "Overall": 70.3,
8
+ "Classification": 65.7,
9
+ "VQA": 65.4,
10
+ "Retrieval": 70.9,
11
+ "Grounding": 91.9
12
+ },
13
+ {
14
+ "Model": "LLaVE-2B",
15
+ "URL": "https://huggingface.co/zhibinlan/LLaVE-2B",
16
+ "Model Size(B)": 1.95,
17
+ "Data Source": "Self-Reported",
18
+ "Overall": 65.2,
19
+ "Classification": 62.1,
20
+ "VQA": 60.2,
21
+ "Retrieval": 65.2,
22
+ "Grounding": 84.9
23
+ },
24
+ {
25
+ "Model": "LLaVE-0.5B",
26
+ "URL": "https://huggingface.co/zhibinlan/LLaVE-0.5B",
27
+ "Model Size(B)": 0.894,
28
+ "Data Source": "Self-Reported",
29
+ "Overall": 59.1,
30
+ "Classification": 57.4,
31
+ "VQA": 50.3,
32
+ "Retrieval": 59.8,
33
+ "Grounding": 82.9
34
+ }
35
+ ]
Archive/UniME_results.json ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "Model": "UniME(LLaVA-OneVision-7B-LoRA-Res336)",
4
+ "URL": "https://huggingface.co/DeepGlint-AI/UniME-LLaVA-OneVision-7B",
5
+ "Model Size(B)": 8.03,
6
+ "Data Source": "Self-Reported",
7
+ "Overall": 70.7,
8
+ "Classification": 66.8,
9
+ "VQA": 66.6,
10
+ "Retrieval": 70.5,
11
+ "Grounding": 90.9
12
+ },
13
+ {
14
+ "Model": "UniME(LLaVA-1.6-7B-LoRA-LowRes)",
15
+ "URL": "https://huggingface.co/DeepGlint-AI/UniME-LLaVA-1.6-7B",
16
+ "Model Size(B)": 7.57,
17
+ "Data Source": "Self-Reported",
18
+ "Overall": 66.6,
19
+ "Classification": 60.6,
20
+ "VQA": 52.9,
21
+ "Retrieval": 67.9,
22
+ "Grounding": 85.1
23
+ },
24
+ {
25
+ "Model": "UniME(Phi-3.5-V-LoRA)",
26
+ "URL": "https://huggingface.co/DeepGlint-AI/UniME-Phi3.5-V-4.2B",
27
+ "Model Size(B)": 4.2,
28
+ "Data Source": "Self-Reported",
29
+ "Overall": 64.2,
30
+ "Classification": 54.8,
31
+ "VQA": 55.9,
32
+ "Retrieval": 64.5,
33
+ "Grounding": 81.8
34
+ }
35
+ ]
Archive/meta-score-BGE-VL-v1.5-mmeb.json ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "Classification": {
3
+ "ImageNet-1K": 0.78,
4
+ "N24News": 0.812,
5
+ "HatefulMemes": 0.616,
6
+ "VOC2007": 0.928,
7
+ "SUN397": 0.836,
8
+ "Place365": 0.468,
9
+ "ImageNet-A": 0.449,
10
+ "ImageNet-R": 0.771,
11
+ "ObjectNet": 0.54,
12
+ "Country211": 0.172,
13
+ "avg": 0.6372
14
+ },
15
+ "VQA": {
16
+ "OK-VQA": 0.749,
17
+ "A-OKVQA": 0.599,
18
+ "DocVQA": 0.854,
19
+ "InfographicsVQA": 0.47,
20
+ "ChartQA": 0.487,
21
+ "Visual7W": 0.613,
22
+ "ScienceQA": 0.679,
23
+ "VizWiz": 0.493,
24
+ "GQA": 0.728,
25
+ "TextVQA": 0.814,
26
+ "avg": 0.6486
27
+ },
28
+ "Retrieval": {
29
+ "VisDial": 0.846,
30
+ "CIRR": 0.635,
31
+ "VisualNews_t2i": 0.787,
32
+ "VisualNews_i2t": 0.816,
33
+ "MSCOCO_t2i": 0.793,
34
+ "MSCOCO_i2t": 0.755,
35
+ "NIGHTS": 0.698,
36
+ "WebQA": 0.904,
37
+ "OVEN": 0.576,
38
+ "FashionIQ": 0.269,
39
+ "EDIS": 0.904,
40
+ "Wiki-SS-NQ": 0.676,
41
+ "avg": 0.7215833333333332
42
+ },
43
+ "Visual Grounding": {
44
+ "MSCOCO": 0.824,
45
+ "Visual7W-Pointing": 0.912,
46
+ "RefCOCO": 0.911,
47
+ "RefCOCO-Matching": 0.815,
48
+ "avg": 0.8655
49
+ },
50
+ "avg": 0.693861111111111
51
+ }
Archive/meta-score-BGE-VL-v1.5-zs.json ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "Classification": {
3
+ "ImageNet-1K": 0.636,
4
+ "N24News": 0.511,
5
+ "HatefulMemes": 0.51,
6
+ "VOC2007": 0.78,
7
+ "SUN397": 0.722,
8
+ "Place365": 0.431,
9
+ "ImageNet-A": 0.488,
10
+ "ImageNet-R": 0.758,
11
+ "ObjectNet": 0.618,
12
+ "Country211": 0.152,
13
+ "avg": 0.5606000000000001
14
+ },
15
+ "VQA": {
16
+ "OK-VQA": 0.642,
17
+ "A-OKVQA": 0.53,
18
+ "DocVQA": 0.688,
19
+ "InfographicsVQA": 0.319,
20
+ "ChartQA": 0.355,
21
+ "Visual7W": 0.488,
22
+ "ScienceQA": 0.462,
23
+ "VizWiz": 0.515,
24
+ "GQA": 0.755,
25
+ "TextVQA": 0.777,
26
+ "avg": 0.5531
27
+ },
28
+ "Retrieval": {
29
+ "VisDial": 0.701,
30
+ "CIRR": 0.601,
31
+ "VisualNews_t2i": 0.63,
32
+ "VisualNews_i2t": 0.669,
33
+ "MSCOCO_t2i": 0.719,
34
+ "MSCOCO_i2t": 0.63,
35
+ "NIGHTS": 0.598,
36
+ "WebQA": 0.852,
37
+ "OVEN": 0.529,
38
+ "FashionIQ": 0.246,
39
+ "EDIS": 0.807,
40
+ "Wiki-SS-NQ": 0.687,
41
+ "avg": 0.6390833333333334
42
+ },
43
+ "Visual Grounding": {
44
+ "MSCOCO": 0.521,
45
+ "Visual7W-Pointing": 0.789,
46
+ "RefCOCO": 0.74,
47
+ "RefCOCO-Matching": 0.784,
48
+ "avg": 0.7084999999999999
49
+ },
50
+ "avg": 0.6011111111111112
51
+ }
Archive/mmE5_mmeb.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "Model": "mmE5-mllama-11b-instruct",
4
+ "URL": "https://huggingface.co/intfloat/mmE5-mllama-11b-instruct",
5
+ "Model Size(B)": 10.6,
6
+ "Data Source": "Self-Reported",
7
+ "Overall": 69.8,
8
+ "Classification": 67.6,
9
+ "VQA": 62.6,
10
+ "Retrieval": 71.0,
11
+ "Grounding": 89.6
12
+ }
13
+ ]
Archive/mmeb-qqmm.json ADDED
@@ -0,0 +1 @@
 
 
1
+ [{"Model": "QQMM-embed", "Model Size(B)": 8.297, "Data Source": "Self-Reported", "Overall": 72.175, "Classification": 70.07, "VQA": 69.52, "Retrieval": 71.175, "Grounding": 87.075}]