Upload folder using huggingface_hub
Browse files. This view is limited to 50 files because it contains too many changes.
See raw diff
- all_tasks.json +34 -0
- continuous/scenario-11.json +11 -0
- continuous/scenario-12.json +11 -0
- continuous/scenario-14.json +11 -0
- continuous/scenario-18.json +11 -0
- continuous/scenario-5.json +11 -0
- continuous/scenario-8.json +11 -0
- create_scenario.py +42 -0
- disjoint/scenario-1.json +8 -0
- disjoint/scenario-10.json +11 -0
- disjoint/scenario-102.json +8 -0
- disjoint/scenario-103.json +8 -0
- disjoint/scenario-104.json +8 -0
- disjoint/scenario-105.json +8 -0
- disjoint/scenario-106.json +8 -0
- disjoint/scenario-107.json +8 -0
- disjoint/scenario-11.json +11 -0
- disjoint/scenario-12.json +11 -0
- disjoint/scenario-14.json +11 -0
- disjoint/scenario-15.json +15 -0
- disjoint/scenario-16.json +11 -0
- disjoint/scenario-17.json +14 -0
- disjoint/scenario-18.json +11 -0
- disjoint/scenario-2.json +11 -0
- disjoint/scenario-20.json +11 -0
- disjoint/scenario-22.json +11 -0
- disjoint/scenario-28.json +11 -0
- disjoint/scenario-3.json +11 -0
- disjoint/scenario-32.json +11 -0
- disjoint/scenario-38.json +11 -0
- disjoint/scenario-4.json +11 -0
- disjoint/scenario-5.json +11 -0
- disjoint/scenario-6.json +8 -0
- disjoint/scenario-7.json +12 -0
- disjoint/scenario-8.json +11 -0
- disjoint/scenario-9.json +11 -0
- fcl_scenarios/scenario-0.json +92 -0
- fcl_scenarios/scenario-1.json +14 -0
- fcl_scenarios/scenario-10.json +26 -0
- fcl_scenarios/scenario-2.json +26 -0
- fcl_scenarios/scenario-20.json +92 -0
- fcl_scenarios/scenario-21.json +20 -0
- fcl_scenarios/scenario-22.json +38 -0
- fcl_scenarios/scenario-23.json +11 -0
- fcl_scenarios/scenario-24.json +20 -0
- fcl_scenarios/scenario-28.json +38 -0
- fcl_scenarios/scenario-29.json +38 -0
- fcl_scenarios/scenario-3.json +20 -0
- fcl_scenarios/scenario-4.json +14 -0
- fcl_scenarios/scenario-40.json +242 -0
all_tasks.json
ADDED
@@ -0,0 +1,34 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{"dataset": "AQUA","subset_id": 0, "task_name": "no external knowledge"},
|
3 |
+
{"dataset": "AQUA","subset_id": 1, "task_name": "need external knowledge 1"},
|
4 |
+
{"dataset": "AQUA","subset_id": 2, "task_name": "need external knowledge 2"},
|
5 |
+
{"dataset": "Mementos","subset_id": 0},
|
6 |
+
{"dataset": "SciCap","subset_id": 0, "task_name": "Yes-subfig"},
|
7 |
+
{"dataset": "SciCap","subset_id": 1, "task_name": "No-subfig"},
|
8 |
+
{"dataset": "Bongard-OpenWorld","subset_id": 0},
|
9 |
+
{"dataset": "HRVQA","subset_id": 0, "task_name": "areas"},
|
10 |
+
{"dataset": "HRVQA","subset_id": 1, "task_name": "color"},
|
11 |
+
{"dataset": "HRVQA","subset_id": 2, "task_name": "location"},
|
12 |
+
{"dataset": "HRVQA","subset_id": 3, "task_name": "numbers"},
|
13 |
+
{"dataset": "HRVQA","subset_id": 4, "task_name": "scene"},
|
14 |
+
{"dataset": "HRVQA","subset_id": 5, "task_name": "shape"},
|
15 |
+
{"dataset": "HRVQA","subset_id": 6, "task_name": "size"},
|
16 |
+
{"dataset": "HRVQA","subset_id": 7, "task_name": "sports"},
|
17 |
+
{"dataset": "HRVQA","subset_id": 8, "task_name": "transportation"},
|
18 |
+
{"dataset": "HRVQA","subset_id": 9, "task_name": "yes no"},
|
19 |
+
{"dataset": "mPLUG","subset_id": 0, "task_name": "areas"},
|
20 |
+
{"dataset": "mPLUG","subset_id": 1, "task_name": "color"},
|
21 |
+
{"dataset": "mPLUG","subset_id": 2, "task_name": "location"},
|
22 |
+
{"dataset": "mPLUG","subset_id": 3, "task_name": "numbers"},
|
23 |
+
{"dataset": "mPLUG","subset_id": 4, "task_name": "scene"},
|
24 |
+
{"dataset": "mPLUG","subset_id": 5, "task_name": "shape"},
|
25 |
+
{"dataset": "mPLUG","subset_id": 6, "task_name": "size"},
|
26 |
+
{"dataset": "mPLUG","subset_id": 7, "task_name": "sports"},
|
27 |
+
{"dataset": "Birds-to-Words","subset_id": 0},
|
28 |
+
{"dataset": "DiDeMoSV","subset_id": 0},
|
29 |
+
{"dataset": "VIST","subset_id": 0},
|
30 |
+
{"dataset": "Describe-Diff","subset_id": 0},
|
31 |
+
{"dataset": "NLVR2","subset_id": 0},
|
32 |
+
{"dataset": "NLVR2","subset_id": 1},
|
33 |
+
{"dataset": "KGQA","subset_id": 0}
|
34 |
+
]
|
continuous/scenario-11.json
ADDED
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "Bongard-HOI","subset_id": 150, "type":"multi-choice"},
|
6 |
+
{"dataset": "NLVR2","subset_id": 150, "type":"multi-choice"},
|
7 |
+
{"dataset": "Co-Instruct-DB","subset_id": 150, "type":"multi-choice"},
|
8 |
+
{"dataset": "TQA","subset_id": 150, "type":"multi-choice"}
|
9 |
+
]
|
10 |
+
}
|
11 |
+
]
|
continuous/scenario-12.json
ADDED
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "NLVR2","subset_id": 151, "type":"multi-choice"},
|
6 |
+
{"dataset": "Bongard-HOI","subset_id": 151, "type":"multi-choice"},
|
7 |
+
{"dataset": "HQ_Edit","subset_id": 151, "type":"multi-choice"},
|
8 |
+
{"dataset": "PatternCom","subset_id": 151, "type":"multi-choice"}
|
9 |
+
]
|
10 |
+
}
|
11 |
+
]
|
continuous/scenario-14.json
ADDED
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "Bongard-OpenWorld","subset_id": 153, "type":"multi-choice"},
|
6 |
+
{"dataset": "Co-Instruct-DB","subset_id": 153, "type":"multi-choice"},
|
7 |
+
{"dataset": "dvqa","subset_id": 153, "type":"multi-choice"},
|
8 |
+
{"dataset": "NLVR2","subset_id": 153, "type":"multi-choice"}
|
9 |
+
]
|
10 |
+
}
|
11 |
+
]
|
continuous/scenario-18.json
ADDED
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "Bongard-OpenWorld","subset_id": 300, "type":"multi-choice"},
|
6 |
+
{"dataset": "Co-Instruct-DB","subset_id": 300, "type":"multi-choice"},
|
7 |
+
{"dataset": "dvqa","subset_id": 300, "type":"multi-choice"},
|
8 |
+
{"dataset": "HQ_Edit","subset_id": 300, "type":"multi-choice"}
|
9 |
+
]
|
10 |
+
}
|
11 |
+
]
|
continuous/scenario-5.json
ADDED
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "Bongard-HOI","subset_id": 180, "type":"multi-choice"},
|
6 |
+
{"dataset": "Bongard-HOI","subset_id": 181, "type":"multi-choice"},
|
7 |
+
{"dataset": "Bongard-HOI","subset_id": 182, "type":"multi-choice"},
|
8 |
+
{"dataset": "Bongard-HOI","subset_id": 183, "type":"multi-choice"}
|
9 |
+
]
|
10 |
+
}
|
11 |
+
]
|
continuous/scenario-8.json
ADDED
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "NLVR2","subset_id": 152, "type":"multi-choice"},
|
6 |
+
{"dataset": "HQ_Edit","subset_id": 152, "type":"multi-choice"},
|
7 |
+
{"dataset": "PatternCom","subset_id": 152, "type":"multi-choice"},
|
8 |
+
{"dataset": "Bongard-HOI","subset_id": 152, "type":"multi-choice"}
|
9 |
+
]
|
10 |
+
}
|
11 |
+
]
|
create_scenario.py
ADDED
@@ -0,0 +1,42 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
import random
|
2 |
+
import os
|
3 |
+
import argparse
|
4 |
+
import json
|
5 |
+
|
6 |
+
def main(argv=None):
    """Build a client/task scenario file from ``./all_tasks.json``.

    The task list is loaded from ``./all_tasks.json`` (resolved against the
    current working directory), shuffled with the requested seed, and cut
    into consecutive, non-overlapping slices -- one slice per client.  Every
    client receives ``min(--max_task, len(tasks) // --client_num)`` tasks;
    tasks left over after the last slice are not assigned to anyone.

    The result is written to the current working directory as
    ``scenario_{client_num}clients_{tasks_per_client}tasks_seed{seed}.json``,
    a JSON list of ``{"client_id": ..., "datasets": [...]}`` objects.

    Args:
        argv: Optional list of command-line argument strings.  When ``None``
            (the default) argparse falls back to ``sys.argv[1:]``, so the
            script behaves as before when run from the command line.

    Raises:
        SystemExit: Raised by argparse (exit status 2) when ``--client_num``
            is missing or not positive, when ``--max_task`` is not positive,
            or when there are fewer tasks than clients.
    """
    parser = argparse.ArgumentParser()

    # Command-line options: RNG seed, number of clients, per-client task cap.
    parser.add_argument('--seed', type=int, default=0, help='Random seed')
    # Required: without a value the split below cannot be computed at all
    # (the original crashed with a TypeError on ``len(...) // None``).
    parser.add_argument('--client_num', type=int, required=True, help='Number of client')
    parser.add_argument('--max_task', type=int, default=4, help='Maximum number of tasks per client')

    args = parser.parse_args(argv)

    # Reject values that would divide by zero or yield empty/negative slices.
    if args.client_num < 1:
        parser.error('--client_num must be a positive integer')
    if args.max_task < 1:
        parser.error('--max_task must be a positive integer')

    random.seed(args.seed)

    with open('./all_tasks.json', 'r', encoding='utf-8') as fp:
        task_list = json.load(fp)

    print('total available tasks:', len(task_list))

    # With more clients than tasks the per-client share would be 0 and every
    # client would silently end up with an empty dataset list.
    if args.client_num > len(task_list):
        parser.error(
            f'--client_num ({args.client_num}) exceeds the number of '
            f'available tasks ({len(task_list)})'
        )

    max_task_per_client = min(args.max_task, len(task_list) // args.client_num)

    random.shuffle(task_list)

    # Client i gets the i-th consecutive window of the shuffled list, so no
    # task is shared between clients.
    scenario_data = [
        {
            'client_id': client_id,
            'datasets': task_list[client_id * max_task_per_client:(client_id + 1) * max_task_per_client],
        }
        for client_id in range(args.client_num)
    ]

    output_path = f'scenario_{args.client_num}clients_{max_task_per_client}tasks_seed{args.seed}.json'

    with open(output_path, 'w', encoding='utf-8') as json_file:
        json.dump(scenario_data, json_file, indent=4)


if __name__ == "__main__":
    main()
|
disjoint/scenario-1.json
ADDED
@@ -0,0 +1,8 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "HRVQA","subset_id": 100, "type":"multi-choice"}
|
6 |
+
]
|
7 |
+
}
|
8 |
+
]
|
disjoint/scenario-10.json
ADDED
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "Co-Instruct-DB","subset_id": 0, "type":"multi-choice"},
|
6 |
+
{"dataset": "Co-Instruct-DB","subset_id": 1, "type":"multi-choice"},
|
7 |
+
{"dataset": "Co-Instruct-DB","subset_id": 2, "type":"open-ended", "metric":"RougeL"},
|
8 |
+
{"dataset": "Co-Instruct-DB","subset_id": 3, "type":"open-ended", "metric":"RougeL"}
|
9 |
+
]
|
10 |
+
}
|
11 |
+
]
|
disjoint/scenario-102.json
ADDED
@@ -0,0 +1,8 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "DreamSim","subset_id": 0, "type":"multi-choice"}
|
6 |
+
]
|
7 |
+
}
|
8 |
+
]
|
disjoint/scenario-103.json
ADDED
@@ -0,0 +1,8 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "RecipeQA_TextCloze","subset_id": 0, "type":"multi-choice"}
|
6 |
+
]
|
7 |
+
}
|
8 |
+
]
|
disjoint/scenario-104.json
ADDED
@@ -0,0 +1,8 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "MagicBrush","subset_id": 0, "type":"multi-choice"}
|
6 |
+
]
|
7 |
+
}
|
8 |
+
]
|
disjoint/scenario-105.json
ADDED
@@ -0,0 +1,8 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "COMICS_Panel","subset_id": 0, "type":"multi-choice"}
|
6 |
+
]
|
7 |
+
}
|
8 |
+
]
|
disjoint/scenario-106.json
ADDED
@@ -0,0 +1,8 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "RecipeQA_ImageCoherence","subset_id": 0, "type":"multi-choice"}
|
6 |
+
]
|
7 |
+
}
|
8 |
+
]
|
disjoint/scenario-107.json
ADDED
@@ -0,0 +1,8 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "Mantis_contrastive_caption","subset_id": 0, "type":"multi-choice"}
|
6 |
+
]
|
7 |
+
}
|
8 |
+
]
|
disjoint/scenario-11.json
ADDED
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "Bongard-HOI","subset_id": 50, "type":"multi-choice"},
|
6 |
+
{"dataset": "NLVR2","subset_id": 0, "type":"multi-choice"},
|
7 |
+
{"dataset": "Co-Instruct-DB","subset_id": 0, "type":"multi-choice"},
|
8 |
+
{"dataset": "TQA","subset_id": 0, "type":"multi-choice"}
|
9 |
+
]
|
10 |
+
}
|
11 |
+
]
|
disjoint/scenario-12.json
ADDED
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "NLVR2-2","subset_id": 0, "type":"multi-choice"},
|
6 |
+
{"dataset": "Bongard-HOI2","subset_id": 50, "type":"multi-choice"},
|
7 |
+
{"dataset": "HQ_Edit-2","subset_id": 0, "type":"multi-choice"},
|
8 |
+
{"dataset": "PatternCom-2","subset_id": 0, "type":"multi-choice"}
|
9 |
+
]
|
10 |
+
}
|
11 |
+
]
|
disjoint/scenario-14.json
ADDED
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "Bongard-OpenWorld","subset_id": 1, "type":"multi-choice"},
|
6 |
+
{"dataset": "Co-Instruct-DB","subset_id": 0, "type":"multi-choice"},
|
7 |
+
{"dataset": "dvqa","subset_id": 0, "type":"multi-choice"},
|
8 |
+
{"dataset": "NLVR2","subset_id": 0, "type":"multi-choice"}
|
9 |
+
]
|
10 |
+
}
|
11 |
+
]
|
disjoint/scenario-15.json
ADDED
@@ -0,0 +1,15 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "ScienceQA","subset_id": 4, "type":"onlyLang"},
|
6 |
+
{"dataset": "TextVQA","subset_id": 6, "type":"ocr"},
|
7 |
+
{"dataset": "ImageNet","subset_id": 4, "type":"classification"},
|
8 |
+
{"dataset": "GQA","subset_id": 4, "type":"truth-alignment"},
|
9 |
+
{"dataset": "VizWiz2","subset_id": 4, "type":"truth-alignment"},
|
10 |
+
{"dataset": "COCO2014","subset_id": 4, "type":"grounding"},
|
11 |
+
{"dataset": "COCO2014","subset_id": 5, "type":"truth-alignment"},
|
12 |
+
{"dataset": "OCR-VQA","subset_id": 4, "type":"truth-alignment"}
|
13 |
+
]
|
14 |
+
}
|
15 |
+
]
|
disjoint/scenario-16.json
ADDED
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "M3IT","subset_id": 3, "type":"open-ended", "metric":"accuracy"},
|
6 |
+
{"dataset": "MANTIS","subset_id": 2, "type":"open-ended", "metric":"accuracy"},
|
7 |
+
{"dataset": "LaMM","subset_id": 2, "type":"open-ended", "metric":"accuracy"},
|
8 |
+
{"dataset": "VisionFLAN","subset_id": 2, "type":"open-ended", "metric":"accuracy"}
|
9 |
+
]
|
10 |
+
}
|
11 |
+
]
|
disjoint/scenario-17.json
ADDED
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "Bongard-OpenWorld","subset_id": 99, "type":"multi-choice"},
|
6 |
+
{"dataset": "NLVR2-2","subset_id": 99, "type":"multi-choice"},
|
7 |
+
{"dataset": "Co-Instruct-DB2","subset_id": 99, "type":"multi-choice"},
|
8 |
+
{"dataset": "Bongard-HOI","subset_id": 99, "type":"multi-choice"},
|
9 |
+
{"dataset": "PatternCom-2","subset_id": 99, "type":"multi-choice"},
|
10 |
+
{"dataset": "dvqa2","subset_id": 99, "type":"multi-choice"},
|
11 |
+
{"dataset": "HQ_Edit2","subset_id": 99, "type":"multi-choice"}
|
12 |
+
]
|
13 |
+
}
|
14 |
+
]
|
disjoint/scenario-18.json
ADDED
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "Bongard-OpenWorld","subset_id": 3, "type":"multi-choice"},
|
6 |
+
{"dataset": "Co-Instruct-DB","subset_id": 0, "type":"multi-choice"},
|
7 |
+
{"dataset": "dvqa","subset_id": 0, "type":"multi-choice"},
|
8 |
+
{"dataset": "HQ_Edit","subset_id": 0, "type":"multi-choice"}
|
9 |
+
]
|
10 |
+
}
|
11 |
+
]
|
disjoint/scenario-2.json
ADDED
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "HRVQA","subset_id": 1, "type":"multi-choice"},
|
6 |
+
{"dataset": "Bongard-HOI","subset_id": 1, "type":"multi-choice"},
|
7 |
+
{"dataset": "mPLUG","subset_id": 0, "type":"open-ended"},
|
8 |
+
{"dataset": "NLVR2","subset_id": 0,"type":"multi-choice"}
|
9 |
+
]
|
10 |
+
}
|
11 |
+
]
|
disjoint/scenario-20.json
ADDED
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "ChartQA2","subset_id": 0, "type":"open-ended", "metric":"accuracy"},
|
6 |
+
{"dataset": "DocVQA2","subset_id": 0, "type":"open-ended", "metric":"accuracy"},
|
7 |
+
{"dataset": "iconqa2","subset_id": 0, "type":"open-ended", "metric":"accuracy"},
|
8 |
+
{"dataset": "PathVQA2","subset_id": 0, "type":"open-ended", "metric":"accuracy"}
|
9 |
+
]
|
10 |
+
}
|
11 |
+
]
|
disjoint/scenario-22.json
ADDED
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "PatternCom-2","subset_id": 0, "type":"multi-choice"},
|
6 |
+
{"dataset": "NLVR2-2","subset_id": 0, "type":"multi-choice"},
|
7 |
+
{"dataset": "HQ_Edit-2","subset_id": 0, "type":"multi-choice"},
|
8 |
+
{"dataset": "Bongard-HOI2","subset_id": 50, "type":"multi-choice"}
|
9 |
+
]
|
10 |
+
}
|
11 |
+
]
|
disjoint/scenario-28.json
ADDED
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "HQ_Edit","subset_id": 0, "type":"multi-choice"},
|
6 |
+
{"dataset": "Bongard-OpenWorld","subset_id": 3, "type":"multi-choice"},
|
7 |
+
{"dataset": "dvqa","subset_id": 0, "type":"multi-choice"},
|
8 |
+
{"dataset": "Co-Instruct-DB","subset_id": 0, "type":"multi-choice"}
|
9 |
+
]
|
10 |
+
}
|
11 |
+
]
|
disjoint/scenario-3.json
ADDED
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "HRVQA","subset_id": 1, "type":"multi-choice"},
|
6 |
+
{"dataset": "HRVQA","subset_id": 5, "type":"multi-choice"},
|
7 |
+
{"dataset": "HRVQA","subset_id": 6, "type":"multi-choice"},
|
8 |
+
{"dataset": "HRVQA","subset_id": 9, "type":"multi-choice"}
|
9 |
+
]
|
10 |
+
}
|
11 |
+
]
|
disjoint/scenario-32.json
ADDED
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "HQ_Edit-2","subset_id": 0, "type":"multi-choice"},
|
6 |
+
{"dataset": "PatternCom-2","subset_id": 0, "type":"multi-choice"},
|
7 |
+
{"dataset": "Bongard-HOI2","subset_id": 50, "type":"multi-choice"},
|
8 |
+
{"dataset": "NLVR2-2","subset_id": 0, "type":"multi-choice"}
|
9 |
+
]
|
10 |
+
}
|
11 |
+
]
|
disjoint/scenario-38.json
ADDED
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "dvqa","subset_id": 0, "type":"multi-choice"},
|
6 |
+
{"dataset": "HQ_Edit","subset_id": 0, "type":"multi-choice"},
|
7 |
+
{"dataset": "Bongard-OpenWorld","subset_id": 3, "type":"multi-choice"},
|
8 |
+
{"dataset": "Co-Instruct-DB","subset_id": 0, "type":"multi-choice"}
|
9 |
+
]
|
10 |
+
}
|
11 |
+
]
|
disjoint/scenario-4.json
ADDED
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "HRVQA","subset_id": 100, "type":"multi-choice"},
|
6 |
+
{"dataset": "Bongard-HOI","subset_id": 100, "type":"multi-choice"},
|
7 |
+
{"dataset": "mPLUG","subset_id": 100, "type":"open-ended"},
|
8 |
+
{"dataset": "NLVR2","subset_id": 100,"type":"multi-choice"}
|
9 |
+
]
|
10 |
+
}
|
11 |
+
]
|
disjoint/scenario-5.json
ADDED
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "Bongard-HOI","subset_id": 50, "type":"multi-choice"},
|
6 |
+
{"dataset": "Bongard-HOI","subset_id": 51, "type":"multi-choice"},
|
7 |
+
{"dataset": "Bongard-HOI","subset_id": 52, "type":"multi-choice"},
|
8 |
+
{"dataset": "Bongard-HOI","subset_id": 53, "type":"multi-choice"}
|
9 |
+
]
|
10 |
+
}
|
11 |
+
]
|
disjoint/scenario-6.json
ADDED
@@ -0,0 +1,8 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "Bongard-HOI","subset_id": 90, "type":"multi-choice"}
|
6 |
+
]
|
7 |
+
}
|
8 |
+
]
|
disjoint/scenario-7.json
ADDED
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "WebQA","subset_id": 0, "type":"multi-choice"},
|
6 |
+
{"dataset": "AQUA","subset_id": 0, "type":"multi-choice"},
|
7 |
+
{"dataset": "TQA","subset_id": 0, "type":"multi-choice"},
|
8 |
+
{"dataset": "dvqa","subset_id": 0, "type":"multi-choice"}
|
9 |
+
|
10 |
+
]
|
11 |
+
}
|
12 |
+
]
|
disjoint/scenario-8.json
ADDED
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "NLVR2","subset_id": 0, "type":"multi-choice"},
|
6 |
+
{"dataset": "HQ_Edit","subset_id": 0, "type":"multi-choice"},
|
7 |
+
{"dataset": "PatternCom","subset_id": 0, "type":"multi-choice"},
|
8 |
+
{"dataset": "Bongard-HOI","subset_id": 2, "type":"multi-choice"}
|
9 |
+
]
|
10 |
+
}
|
11 |
+
]
|
disjoint/scenario-9.json
ADDED
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "dvqa","subset_id": 0, "type":"multi-choice"},
|
6 |
+
{"dataset": "HQ_Edit","subset_id": 0, "type":"multi-choice"},
|
7 |
+
{"dataset": "TQA","subset_id": 0, "type":"multi-choice"},
|
8 |
+
{"dataset": "PatternCom","subset_id": 0, "type":"multi-choice"}
|
9 |
+
]
|
10 |
+
}
|
11 |
+
]
|
fcl_scenarios/scenario-0.json
ADDED
@@ -0,0 +1,92 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "Fashion200K","subset_id": 0, "type":"multi-choice"},
|
6 |
+
{"dataset": "Fashion200K","subset_id": 2, "type":"multi-choice"},
|
7 |
+
{"dataset": "Fashion200K","subset_id": 3, "type":"multi-choice"},
|
8 |
+
{"dataset": "FashionIQ","subset_id": 0, "type":"multi-choice"}
|
9 |
+
]
|
10 |
+
},
|
11 |
+
{
|
12 |
+
"client_id": 1,
|
13 |
+
"datasets":[
|
14 |
+
{"dataset": "HRVQA","subset_id": 2, "type":"multi-choice"},
|
15 |
+
{"dataset": "HRVQA","subset_id": 5, "type":"multi-choice"},
|
16 |
+
{"dataset": "HRVQA","subset_id": 7, "type":"multi-choice"},
|
17 |
+
{"dataset": "HRVQA","subset_id": 9, "type":"multi-choice"}
|
18 |
+
]
|
19 |
+
},
|
20 |
+
{
|
21 |
+
"client_id": 2,
|
22 |
+
"datasets":[
|
23 |
+
{"dataset": "NLVR2","subset_id": 0,"type":"multi-choice"},
|
24 |
+
{"dataset": "CIRR","subset_id": 1,"type":"multi-choice"},
|
25 |
+
{"dataset": "HQ_Edit","subset_id": 0,"type":"multi-choice"},
|
26 |
+
{"dataset": "PatternCom","subset_id": 0,"type":"multi-choice"}
|
27 |
+
]
|
28 |
+
},
|
29 |
+
{
|
30 |
+
"client_id": 3,
|
31 |
+
"datasets":[
|
32 |
+
{"dataset": "WebQA","subset_id": 0, "type":"open-ended", "metric":"F1"},
|
33 |
+
{"dataset": "TQA","subset_id": 0, "type":"multi-choice"},
|
34 |
+
{"dataset": "AQUA","subset_id": 0, "type":"open-ended", "metric":"F1"},
|
35 |
+
{"dataset": "dvqa","subset_id": 0, "type":"multi-choice"}
|
36 |
+
]
|
37 |
+
},
|
38 |
+
{
|
39 |
+
"client_id": 4,
|
40 |
+
"datasets":[
|
41 |
+
{"dataset": "Bongard-OpenWorld","subset_id": 3, "type":"multi-choice"},
|
42 |
+
{"dataset": "Bongard-OpenWorld","subset_id": 1, "type":"multi-choice"},
|
43 |
+
{"dataset": "Bongard-HOI","subset_id": 0, "type":"multi-choice"},
|
44 |
+
{"dataset": "Bongard-HOI","subset_id": 1, "type":"multi-choice"}
|
45 |
+
]
|
46 |
+
},
|
47 |
+
{
|
48 |
+
"client_id": 5,
|
49 |
+
"datasets":[
|
50 |
+
{"dataset": "iconqa","subset_id": 0, "type":"multi-choice"},
|
51 |
+
{"dataset": "iconqa","subset_id": 1, "type":"multi-choice"},
|
52 |
+
{"dataset": "iconqa","subset_id": 2, "type":"open-ended", "metric":"F1"},
|
53 |
+
{"dataset": "iconqa","subset_id": 3, "type":"open-ended", "metric":"F1"}
|
54 |
+
]
|
55 |
+
},
|
56 |
+
{
|
57 |
+
"client_id": 6,
|
58 |
+
"datasets":[
|
59 |
+
{"dataset": "Co-Instruct-DB","subset_id": 0, "type":"multi-choice"},
|
60 |
+
{"dataset": "Co-Instruct-DB","subset_id": 1, "type":"multi-choice"},
|
61 |
+
{"dataset": "Co-Instruct-DB","subset_id": 2, "type":"open-ended", "metric":"RougeL"},
|
62 |
+
{"dataset": "Co-Instruct-DB","subset_id": 3, "type":"open-ended", "metric":"RougeL"}
|
63 |
+
]
|
64 |
+
},
|
65 |
+
{
|
66 |
+
"client_id": 7,
|
67 |
+
"datasets":[
|
68 |
+
{"dataset": "Spot-the-Diff","subset_id": 0, "type":"open-ended", "metric":"RougeL"},
|
69 |
+
{"dataset": "Birds-to-Words","subset_id": 0, "type":"open-ended", "metric":"RougeL"},
|
70 |
+
{"dataset": "IEdit","subset_id": 0, "type":"open-ended", "metric":"RougeL"},
|
71 |
+
{"dataset": "CLEVR-Change","subset_id": 0, "type":"open-ended", "metric":"RougeL"}
|
72 |
+
]
|
73 |
+
},
|
74 |
+
{
|
75 |
+
"client_id": 8,
|
76 |
+
"datasets":[
|
77 |
+
{"dataset": "PororoSV","subset_id": 0, "type":"open-ended", "metric":"RougeL"},
|
78 |
+
{"dataset": "FlintstonesSV","subset_id": 0, "type":"open-ended", "metric":"RougeL"},
|
79 |
+
{"dataset": "VIST","subset_id": 0, "type":"open-ended", "metric":"RougeL"},
|
80 |
+
{"dataset": "AESOP","subset_id": 0, "type":"open-ended", "metric":"RougeL"}
|
81 |
+
]
|
82 |
+
},
|
83 |
+
{
|
84 |
+
"client_id": 9,
|
85 |
+
"datasets":[
|
86 |
+
{"dataset": "VISION","subset_id": 0, "type":"multi-choice"},
|
87 |
+
{"dataset": "VISION","subset_id": 1, "type":"multi-choice"},
|
88 |
+
{"dataset": "VizWiz","subset_id": 0, "type":"multi-choice"},
|
89 |
+
{"dataset": "MIT-States","subset_id": 0, "type":"multi-choice"}
|
90 |
+
]
|
91 |
+
}
|
92 |
+
]
|
fcl_scenarios/scenario-1.json
ADDED
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "HRVQA","subset_id": 1, "type":"multi-choice"},
|
6 |
+
{"dataset": "HRVQA","subset_id": 6, "type":"multi-choice"},
|
7 |
+
{"dataset": "iconqa","subset_id": 4, "type":"multi-choice"},
|
8 |
+
{"dataset": "ALFRED","subset_id": 0, "type":"open-ended", "metric":"RougeL"},
|
9 |
+
{"dataset": "DiDeMoSV","subset_id": 0, "type":"open-ended", "metric":"RougeL"},
|
10 |
+
{"dataset": "COMICS_Dialogue","subset_id": 0, "type":"multi-choice"},
|
11 |
+
{"dataset": "RecipeQA_ImageCoherence","subset_id": 0,"type":"multi-choice"}
|
12 |
+
]
|
13 |
+
}
|
14 |
+
]
|
fcl_scenarios/scenario-10.json
ADDED
@@ -0,0 +1,26 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "DreamSim","subset_id": 0,"type":"multi-choice"}
|
6 |
+
]
|
7 |
+
},
|
8 |
+
{
|
9 |
+
"client_id": 1,
|
10 |
+
"datasets":[
|
11 |
+
{"dataset": "Mementos","subset_id": 0, "type":"open-ended", "metric":"RougeL"}
|
12 |
+
]
|
13 |
+
},
|
14 |
+
{
|
15 |
+
"client_id": 2,
|
16 |
+
"datasets":[
|
17 |
+
{"dataset": "Bongard-HOI","subset_id": 2, "type":"multi-choice"}
|
18 |
+
]
|
19 |
+
},
|
20 |
+
{
|
21 |
+
"client_id": 3,
|
22 |
+
"datasets":[
|
23 |
+
{"dataset": "Co-Instruct-DB","subset_id": 8, "type":"multi-choice"}
|
24 |
+
]
|
25 |
+
}
|
26 |
+
]
|
fcl_scenarios/scenario-2.json
ADDED
@@ -0,0 +1,26 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "ALFRED","subset_id": 0, "type":"open-ended", "metric":"RougeL"}
|
6 |
+
]
|
7 |
+
},
|
8 |
+
{
|
9 |
+
"client_id": 1,
|
10 |
+
"datasets":[
|
11 |
+
{"dataset": "DiDeMoSV","subset_id": 0, "type":"open-ended", "metric":"RougeL"}
|
12 |
+
]
|
13 |
+
},
|
14 |
+
{
|
15 |
+
"client_id": 2,
|
16 |
+
"datasets":[
|
17 |
+
{"dataset": "COMICS_Dialogue","subset_id": 0, "type":"multi-choice"}
|
18 |
+
]
|
19 |
+
},
|
20 |
+
{
|
21 |
+
"client_id": 3,
|
22 |
+
"datasets":[
|
23 |
+
{"dataset": "RecipeQA_ImageCoherence","subset_id": 0,"type":"multi-choice"}
|
24 |
+
]
|
25 |
+
}
|
26 |
+
]
|
fcl_scenarios/scenario-20.json
ADDED
@@ -0,0 +1,92 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "RecipeQA_TextCloze","subset_id": 0, "type":"multi-choice"},
|
6 |
+
{"dataset": "RecipeQA_VisualCloze","subset_id": 0, "type":"multi-choice"},
|
7 |
+
{"dataset": "COMICS_Dialogue","subset_id": 0, "type":"multi-choice"},
|
8 |
+
{"dataset": "COMICS_Panel","subset_id": 0, "type":"multi-choice"}
|
9 |
+
]
|
10 |
+
},
|
11 |
+
{
|
12 |
+
"client_id": 1,
|
13 |
+
"datasets":[
|
14 |
+
{"dataset": "HRVQA","subset_id": 1, "type":"multi-choice"},
|
15 |
+
{"dataset": "HRVQA","subset_id": 5, "type":"multi-choice"},
|
16 |
+
{"dataset": "HRVQA","subset_id": 6, "type":"multi-choice"},
|
17 |
+
{"dataset": "HRVQA","subset_id": 9, "type":"multi-choice"}
|
18 |
+
]
|
19 |
+
},
|
20 |
+
{
|
21 |
+
"client_id": 2,
|
22 |
+
"datasets":[
|
23 |
+
{"dataset": "Fashion200K","subset_id": 0,"type":"multi-choice"},
|
24 |
+
{"dataset": "Fashion200K","subset_id": 1,"type":"multi-choice"},
|
25 |
+
{"dataset": "RecipeQA_ImageCoherence","subset_id": 0,"type":"multi-choice"},
|
26 |
+
{"dataset": "NLVR2","subset_id": 0,"type":"multi-choice"}
|
27 |
+
]
|
28 |
+
},
|
29 |
+
{
|
30 |
+
"client_id": 3,
|
31 |
+
"datasets":[
|
32 |
+
{"dataset": "WebQA","subset_id": 0, "type":"open-ended"},
|
33 |
+
{"dataset": "TQA","subset_id": 0, "type":"multi-choice"},
|
34 |
+
{"dataset": "AQUA","subset_id": 0, "type":"open-ended"},
|
35 |
+
{"dataset": "AQUA","subset_id": 1, "type":"open-ended"}
|
36 |
+
]
|
37 |
+
},
|
38 |
+
{
|
39 |
+
"client_id": 4,
|
40 |
+
"datasets":[
|
41 |
+
{"dataset": "Bongard-OpenWorld","subset_id": 0, "type":"open-ended"},
|
42 |
+
{"dataset": "Bongard-OpenWorld","subset_id": 1, "type":"multi-choice"},
|
43 |
+
{"dataset": "Bongard-HOI","subset_id": 0, "type":"multi-choice"},
|
44 |
+
{"dataset": "Bongard-HOI","subset_id": 1, "type":"multi-choice"}
|
45 |
+
]
|
46 |
+
},
|
47 |
+
{
|
48 |
+
"client_id": 5,
|
49 |
+
"datasets":[
|
50 |
+
{"dataset": "HRVQA","subset_id": 2, "type":"multi-choice"},
|
51 |
+
{"dataset": "HRVQA","subset_id": 4, "type":"multi-choice"},
|
52 |
+
{"dataset": "HRVQA","subset_id": 7, "type":"multi-choice"},
|
53 |
+
{"dataset": "HRVQA","subset_id": 8, "type":"multi-choice"}
|
54 |
+
]
|
55 |
+
},
|
56 |
+
{
|
57 |
+
"client_id": 6,
|
58 |
+
"datasets":[
|
59 |
+
{"dataset": "mPLUG","subset_id": 0, "type":"open-ended"},
|
60 |
+
{"dataset": "mPLUG","subset_id": 1, "type":"open-ended"},
|
61 |
+
{"dataset": "mPLUG","subset_id": 2, "type":"open-ended"},
|
62 |
+
{"dataset": "mPLUG","subset_id": 4, "type":"open-ended"}
|
63 |
+
]
|
64 |
+
},
|
65 |
+
{
|
66 |
+
"client_id": 7,
|
67 |
+
"datasets":[
|
68 |
+
{"dataset": "Spot-the-Diff","subset_id": 0, "type":"open-ended"},
|
69 |
+
{"dataset": "Birds-to-Words","subset_id": 0, "type":"open-ended"},
|
70 |
+
{"dataset": "IEdit","subset_id": 0, "type":"open-ended"},
|
71 |
+
{"dataset": "CLEVR-Change","subset_id": 0, "type":"open-ended"}
|
72 |
+
]
|
73 |
+
},
|
74 |
+
{
|
75 |
+
"client_id": 8,
|
76 |
+
"datasets":[
|
77 |
+
{"dataset": "PororoSV","subset_id": 0, "type":"open-ended"},
|
78 |
+
{"dataset": "FlintstonesSV","subset_id": 0, "type":"open-ended"},
|
79 |
+
{"dataset": "VIST","subset_id": 0, "type":"open-ended"},
|
80 |
+
{"dataset": "AESOP","subset_id": 0, "type":"open-ended"}
|
81 |
+
]
|
82 |
+
},
|
83 |
+
{
|
84 |
+
"client_id": 9,
|
85 |
+
"datasets":[
|
86 |
+
{"dataset": "VISION","subset_id": 0, "type":"multi-choice"},
|
87 |
+
{"dataset": "VISION","subset_id": 1, "type":"multi-choice"},
|
88 |
+
{"dataset": "VizWiz","subset_id": 0, "type":"multi-choice"},
|
89 |
+
{"dataset": "MIT-States","subset_id": 0, "type":"multi-choice"}
|
90 |
+
]
|
91 |
+
}
|
92 |
+
]
|
fcl_scenarios/scenario-21.json
ADDED
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "Fashion200K","subset_id": 0,"type":"multi-choice"},
|
6 |
+
{"dataset": "Fashion200K","subset_id": 1,"type":"multi-choice"},
|
7 |
+
{"dataset": "RecipeQA_ImageCoherence","subset_id": 0,"type":"multi-choice"},
|
8 |
+
{"dataset": "NLVR2","subset_id": 0,"type":"multi-choice"}
|
9 |
+
]
|
10 |
+
},
|
11 |
+
{
|
12 |
+
"client_id": 1,
|
13 |
+
"datasets":[
|
14 |
+
{"dataset": "VISION","subset_id": 0, "type":"multi-choice"},
|
15 |
+
{"dataset": "VISION","subset_id": 1, "type":"multi-choice"},
|
16 |
+
{"dataset": "VizWiz","subset_id": 0, "type":"multi-choice"},
|
17 |
+
{"dataset": "MIT-States","subset_id": 0, "type":"multi-choice"}
|
18 |
+
]
|
19 |
+
}
|
20 |
+
]
|
fcl_scenarios/scenario-22.json
ADDED
@@ -0,0 +1,38 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "RecipeQA_TextCloze","subset_id": 0, "type":"multi-choice"},
|
6 |
+
{"dataset": "RecipeQA_VisualCloze","subset_id": 0, "type":"multi-choice"},
|
7 |
+
{"dataset": "COMICS_Dialogue","subset_id": 0, "type":"multi-choice"},
|
8 |
+
{"dataset": "COMICS_Panel","subset_id": 0, "type":"multi-choice"}
|
9 |
+
]
|
10 |
+
},
|
11 |
+
{
|
12 |
+
"client_id": 1,
|
13 |
+
"datasets":[
|
14 |
+
{"dataset": "Fashion200K","subset_id": 0,"type":"multi-choice"},
|
15 |
+
{"dataset": "Fashion200K","subset_id": 1,"type":"multi-choice"},
|
16 |
+
{"dataset": "RecipeQA_ImageCoherence","subset_id": 0,"type":"multi-choice"},
|
17 |
+
{"dataset": "NLVR2","subset_id": 0,"type":"multi-choice"}
|
18 |
+
]
|
19 |
+
},
|
20 |
+
{
|
21 |
+
"client_id": 2,
|
22 |
+
"datasets":[
|
23 |
+
{"dataset": "Bongard-OpenWorld","subset_id": 0, "type":"open-ended"},
|
24 |
+
{"dataset": "Bongard-OpenWorld","subset_id": 1, "type":"multi-choice"},
|
25 |
+
{"dataset": "Bongard-HOI","subset_id": 0, "type":"multi-choice"},
|
26 |
+
{"dataset": "Bongard-HOI","subset_id": 1, "type":"multi-choice"}
|
27 |
+
]
|
28 |
+
},
|
29 |
+
{
|
30 |
+
"client_id": 3,
|
31 |
+
"datasets":[
|
32 |
+
{"dataset": "VISION","subset_id": 0, "type":"multi-choice"},
|
33 |
+
{"dataset": "VISION","subset_id": 1, "type":"multi-choice"},
|
34 |
+
{"dataset": "VizWiz","subset_id": 0, "type":"multi-choice"},
|
35 |
+
{"dataset": "MIT-States","subset_id": 0, "type":"multi-choice"}
|
36 |
+
]
|
37 |
+
}
|
38 |
+
]
|
fcl_scenarios/scenario-23.json
ADDED
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "RecipeQA_TextCloze","subset_id": 0, "type":"multi-choice"},
|
6 |
+
{"dataset": "RecipeQA_VisualCloze","subset_id": 0, "type":"multi-choice"},
|
7 |
+
{"dataset": "COMICS_Dialogue","subset_id": 0, "type":"multi-choice"},
|
8 |
+
{"dataset": "COMICS_Panel","subset_id": 0, "type":"multi-choice"}
|
9 |
+
]
|
10 |
+
}
|
11 |
+
]
|
fcl_scenarios/scenario-24.json
ADDED
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "Fashion200K","subset_id": 0,"type":"multi-choice"},
|
6 |
+
{"dataset": "Fashion200K","subset_id": 1,"type":"multi-choice"},
|
7 |
+
{"dataset": "RecipeQA_ImageCoherence","subset_id": 0,"type":"multi-choice"},
|
8 |
+
{"dataset": "NLVR2","subset_id": 0,"type":"multi-choice"}
|
9 |
+
]
|
10 |
+
},
|
11 |
+
{
|
12 |
+
"client_id": 1,
|
13 |
+
"datasets":[
|
14 |
+
{"dataset": "VISION","subset_id": 0, "type":"multi-choice"},
|
15 |
+
{"dataset": "VISION","subset_id": 1, "type":"multi-choice"},
|
16 |
+
{"dataset": "VizWiz","subset_id": 0, "type":"multi-choice"},
|
17 |
+
{"dataset": "MIT-States","subset_id": 0, "type":"multi-choice"}
|
18 |
+
]
|
19 |
+
}
|
20 |
+
]
|
fcl_scenarios/scenario-28.json
ADDED
@@ -0,0 +1,38 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "HRVQA","subset_id": 1, "type":"multi-choice"},
|
6 |
+
{"dataset": "HRVQA","subset_id": 5, "type":"multi-choice"},
|
7 |
+
{"dataset": "HRVQA","subset_id": 6, "type":"multi-choice"},
|
8 |
+
{"dataset": "HRVQA","subset_id": 9, "type":"multi-choice"}
|
9 |
+
]
|
10 |
+
},
|
11 |
+
{
|
12 |
+
"client_id": 1,
|
13 |
+
"datasets":[
|
14 |
+
{"dataset": "WebQA","subset_id": 0, "type":"open-ended"},
|
15 |
+
{"dataset": "TQA","subset_id": 0, "type":"multi-choice"},
|
16 |
+
{"dataset": "AQUA","subset_id": 0, "type":"open-ended"},
|
17 |
+
{"dataset": "AQUA","subset_id": 1, "type":"open-ended"}
|
18 |
+
]
|
19 |
+
},
|
20 |
+
{
|
21 |
+
"client_id": 2,
|
22 |
+
"datasets":[
|
23 |
+
{"dataset": "Spot-the-Diff","subset_id": 0, "type":"open-ended"},
|
24 |
+
{"dataset": "Birds-to-Words","subset_id": 0, "type":"open-ended"},
|
25 |
+
{"dataset": "IEdit","subset_id": 0, "type":"open-ended"},
|
26 |
+
{"dataset": "CLEVR-Change","subset_id": 0, "type":"open-ended"}
|
27 |
+
]
|
28 |
+
},
|
29 |
+
{
|
30 |
+
"client_id": 3,
|
31 |
+
"datasets":[
|
32 |
+
{"dataset": "VISION","subset_id": 0, "type":"multi-choice"},
|
33 |
+
{"dataset": "VISION","subset_id": 1, "type":"multi-choice"},
|
34 |
+
{"dataset": "VizWiz","subset_id": 0, "type":"multi-choice"},
|
35 |
+
{"dataset": "MIT-States","subset_id": 0, "type":"multi-choice"}
|
36 |
+
]
|
37 |
+
}
|
38 |
+
]
|
fcl_scenarios/scenario-29.json
ADDED
@@ -0,0 +1,38 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "RecipeQA_TextCloze","subset_id": 0, "type":"multi-choice"},
|
6 |
+
{"dataset": "RecipeQA_VisualCloze","subset_id": 0, "type":"multi-choice"},
|
7 |
+
{"dataset": "COMICS_Dialogue","subset_id": 0, "type":"multi-choice"},
|
8 |
+
{"dataset": "COMICS_Panel","subset_id": 0, "type":"multi-choice"}
|
9 |
+
]
|
10 |
+
},
|
11 |
+
{
|
12 |
+
"client_id": 1,
|
13 |
+
"datasets":[
|
14 |
+
{"dataset": "HRVQA","subset_id": 1, "type":"multi-choice"},
|
15 |
+
{"dataset": "HRVQA","subset_id": 5, "type":"multi-choice"},
|
16 |
+
{"dataset": "HRVQA","subset_id": 6, "type":"multi-choice"},
|
17 |
+
{"dataset": "HRVQA","subset_id": 9, "type":"multi-choice"}
|
18 |
+
]
|
19 |
+
},
|
20 |
+
{
|
21 |
+
"client_id": 2,
|
22 |
+
"datasets":[
|
23 |
+
{"dataset": "Bongard-OpenWorld","subset_id": 0, "type":"open-ended"},
|
24 |
+
{"dataset": "Bongard-OpenWorld","subset_id": 1, "type":"multi-choice"},
|
25 |
+
{"dataset": "Bongard-HOI","subset_id": 0, "type":"multi-choice"},
|
26 |
+
{"dataset": "Bongard-HOI","subset_id": 1, "type":"multi-choice"}
|
27 |
+
]
|
28 |
+
},
|
29 |
+
{
|
30 |
+
"client_id": 3,
|
31 |
+
"datasets":[
|
32 |
+
{"dataset": "PororoSV","subset_id": 0, "type":"open-ended"},
|
33 |
+
{"dataset": "FlintstonesSV","subset_id": 0, "type":"open-ended"},
|
34 |
+
{"dataset": "VIST","subset_id": 0, "type":"open-ended"},
|
35 |
+
{"dataset": "AESOP","subset_id": 0, "type":"open-ended"}
|
36 |
+
]
|
37 |
+
}
|
38 |
+
]
|
fcl_scenarios/scenario-3.json
ADDED
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "mPLUG","subset_id": 0, "type":"open-ended", "metric":"RougeL"}
|
6 |
+
]
|
7 |
+
},
|
8 |
+
{
|
9 |
+
"client_id": 1,
|
10 |
+
"datasets":[
|
11 |
+
{"dataset": "iconqa","subset_id": 4, "type":"multi-choice"}
|
12 |
+
]
|
13 |
+
},
|
14 |
+
{
|
15 |
+
"client_id": 2,
|
16 |
+
"datasets":[
|
17 |
+
{"dataset": "RecipeQA_TextCloze","subset_id": 0, "type":"multi-choice"}
|
18 |
+
]
|
19 |
+
}
|
20 |
+
]
|
fcl_scenarios/scenario-4.json
ADDED
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "mPLUG","subset_id": 0, "type":"open-ended", "metric":"RougeL"}
|
6 |
+
]
|
7 |
+
},
|
8 |
+
{
|
9 |
+
"client_id": 1,
|
10 |
+
"datasets":[
|
11 |
+
{"dataset": "iconqa","subset_id": 4, "type":"multi-choice"}
|
12 |
+
]
|
13 |
+
}
|
14 |
+
]
|
fcl_scenarios/scenario-40.json
ADDED
@@ -0,0 +1,242 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"client_id": 0,
|
4 |
+
"datasets":[
|
5 |
+
{"dataset": "Fashion200K","subset_id": 0, "type":"multi-choice"}
|
6 |
+
]
|
7 |
+
},
|
8 |
+
{
|
9 |
+
"client_id": 1,
|
10 |
+
"datasets":[
|
11 |
+
{"dataset": "Fashion200K","subset_id": 2, "type":"multi-choice"}
|
12 |
+
]
|
13 |
+
},
|
14 |
+
{
|
15 |
+
"client_id": 2,
|
16 |
+
"datasets":[
|
17 |
+
{"dataset": "Fashion200K","subset_id": 3, "type":"multi-choice"}
|
18 |
+
]
|
19 |
+
},
|
20 |
+
{
|
21 |
+
"client_id": 3,
|
22 |
+
"datasets":[
|
23 |
+
{"dataset": "FashionIQ","subset_id": 0, "type":"multi-choice"}
|
24 |
+
]
|
25 |
+
},
|
26 |
+
{
|
27 |
+
"client_id": 4,
|
28 |
+
"datasets":[
|
29 |
+
{"dataset": "HRVQA","subset_id": 2, "type":"multi-choice"}
|
30 |
+
]
|
31 |
+
},
|
32 |
+
{
|
33 |
+
"client_id": 5,
|
34 |
+
"datasets":[
|
35 |
+
{"dataset": "HRVQA","subset_id": 5, "type":"multi-choice"}
|
36 |
+
]
|
37 |
+
},
|
38 |
+
{
|
39 |
+
"client_id": 6,
|
40 |
+
"datasets":[
|
41 |
+
{"dataset": "HRVQA","subset_id": 7, "type":"multi-choice"}
|
42 |
+
]
|
43 |
+
},
|
44 |
+
{
|
45 |
+
"client_id": 7,
|
46 |
+
"datasets":[
|
47 |
+
{"dataset": "HRVQA","subset_id": 9, "type":"multi-choice"}
|
48 |
+
]
|
49 |
+
},
|
50 |
+
{
|
51 |
+
"client_id": 8,
|
52 |
+
"datasets":[
|
53 |
+
{"dataset": "NLVR2","subset_id": 0,"type":"multi-choice"}
|
54 |
+
]
|
55 |
+
},
|
56 |
+
{
|
57 |
+
"client_id": 9,
|
58 |
+
"datasets":[
|
59 |
+
{"dataset": "CIRR","subset_id": 1,"type":"multi-choice"}
|
60 |
+
]
|
61 |
+
},
|
62 |
+
{
|
63 |
+
"client_id": 10,
|
64 |
+
"datasets":[
|
65 |
+
{"dataset": "HQ_Edit","subset_id": 0,"type":"multi-choice"}
|
66 |
+
]
|
67 |
+
},
|
68 |
+
{
|
69 |
+
"client_id": 11,
|
70 |
+
"datasets":[
|
71 |
+
{"dataset": "PatternCom","subset_id": 0,"type":"multi-choice"}
|
72 |
+
]
|
73 |
+
},
|
74 |
+
{
|
75 |
+
"client_id": 12,
|
76 |
+
"datasets":[
|
77 |
+
{"dataset": "WebQA","subset_id": 0, "type":"open-ended", "metric":"F1"}
|
78 |
+
]
|
79 |
+
},
|
80 |
+
{
|
81 |
+
"client_id": 13,
|
82 |
+
"datasets":[
|
83 |
+
{"dataset": "TQA","subset_id": 0, "type":"multi-choice"}
|
84 |
+
]
|
85 |
+
},
|
86 |
+
{
|
87 |
+
"client_id": 14,
|
88 |
+
"datasets":[
|
89 |
+
{"dataset": "AQUA","subset_id": 0, "type":"open-ended", "metric":"F1"}
|
90 |
+
]
|
91 |
+
},
|
92 |
+
{
|
93 |
+
"client_id": 15,
|
94 |
+
"datasets":[
|
95 |
+
{"dataset": "dvqa","subset_id": 0, "type":"multi-choice"}
|
96 |
+
]
|
97 |
+
},
|
98 |
+
{
|
99 |
+
"client_id": 16,
|
100 |
+
"datasets":[
|
101 |
+
{"dataset": "Bongard-OpenWorld","subset_id": 3, "type":"multi-choice"}
|
102 |
+
]
|
103 |
+
},
|
104 |
+
{
|
105 |
+
"client_id": 17,
|
106 |
+
"datasets":[
|
107 |
+
{"dataset": "Bongard-OpenWorld","subset_id": 1, "type":"multi-choice"}
|
108 |
+
]
|
109 |
+
},
|
110 |
+
{
|
111 |
+
"client_id": 18,
|
112 |
+
"datasets":[
|
113 |
+
{"dataset": "Bongard-HOI","subset_id": 0, "type":"multi-choice"}
|
114 |
+
]
|
115 |
+
},
|
116 |
+
{
|
117 |
+
"client_id": 19,
|
118 |
+
"datasets":[
|
119 |
+
{"dataset": "Bongard-HOI","subset_id": 1, "type":"multi-choice"}
|
120 |
+
]
|
121 |
+
},
|
122 |
+
{
|
123 |
+
"client_id": 20,
|
124 |
+
"datasets":[
|
125 |
+
{"dataset": "iconqa","subset_id": 0, "type":"multi-choice"}
|
126 |
+
]
|
127 |
+
},
|
128 |
+
{
|
129 |
+
"client_id": 21,
|
130 |
+
"datasets":[
|
131 |
+
{"dataset": "iconqa","subset_id": 1, "type":"multi-choice"}
|
132 |
+
]
|
133 |
+
},
|
134 |
+
{
|
135 |
+
"client_id": 22,
|
136 |
+
"datasets":[
|
137 |
+
{"dataset": "iconqa","subset_id": 2, "type":"open-ended", "metric":"F1"}
|
138 |
+
]
|
139 |
+
},
|
140 |
+
{
|
141 |
+
"client_id": 23,
|
142 |
+
"datasets":[
|
143 |
+
{"dataset": "iconqa","subset_id": 3, "type":"open-ended", "metric":"F1"}
|
144 |
+
]
|
145 |
+
},
|
146 |
+
{
|
147 |
+
"client_id": 24,
|
148 |
+
"datasets":[
|
149 |
+
{"dataset": "Co-Instruct-DB","subset_id": 0, "type":"multi-choice"}
|
150 |
+
]
|
151 |
+
},
|
152 |
+
{
|
153 |
+
"client_id": 25,
|
154 |
+
"datasets":[
|
155 |
+
{"dataset": "Co-Instruct-DB","subset_id": 1, "type":"multi-choice"}
|
156 |
+
]
|
157 |
+
},
|
158 |
+
{
|
159 |
+
"client_id": 26,
|
160 |
+
"datasets":[
|
161 |
+
{"dataset": "Co-Instruct-DB","subset_id": 2, "type":"open-ended", "metric":"RougeL"}
|
162 |
+
]
|
163 |
+
},
|
164 |
+
{
|
165 |
+
"client_id": 27,
|
166 |
+
"datasets":[
|
167 |
+
{"dataset": "Co-Instruct-DB","subset_id": 3, "type":"open-ended", "metric":"RougeL"}
|
168 |
+
]
|
169 |
+
},
|
170 |
+
{
|
171 |
+
"client_id": 28,
|
172 |
+
"datasets":[
|
173 |
+
{"dataset": "Spot-the-Diff","subset_id": 0, "type":"open-ended", "metric":"RougeL"}
|
174 |
+
]
|
175 |
+
},
|
176 |
+
{
|
177 |
+
"client_id": 29,
|
178 |
+
"datasets":[
|
179 |
+
{"dataset": "Birds-to-Words","subset_id": 0, "type":"open-ended", "metric":"RougeL"}
|
180 |
+
]
|
181 |
+
},
|
182 |
+
{
|
183 |
+
"client_id": 30,
|
184 |
+
"datasets":[
|
185 |
+
{"dataset": "IEdit","subset_id": 0, "type":"open-ended", "metric":"RougeL"}
|
186 |
+
]
|
187 |
+
},
|
188 |
+
{
|
189 |
+
"client_id": 31,
|
190 |
+
"datasets":[
|
191 |
+
{"dataset": "CLEVR-Change","subset_id": 0, "type":"open-ended", "metric":"RougeL"}
|
192 |
+
]
|
193 |
+
},
|
194 |
+
{
|
195 |
+
"client_id": 32,
|
196 |
+
"datasets":[
|
197 |
+
{"dataset": "PororoSV","subset_id": 0, "type":"open-ended", "metric":"RougeL"}
|
198 |
+
]
|
199 |
+
},
|
200 |
+
{
|
201 |
+
"client_id": 33,
|
202 |
+
"datasets":[
|
203 |
+
{"dataset": "FlintstonesSV","subset_id": 0, "type":"open-ended", "metric":"RougeL"}
|
204 |
+
]
|
205 |
+
},
|
206 |
+
{
|
207 |
+
"client_id": 34,
|
208 |
+
"datasets":[
|
209 |
+
{"dataset": "VIST","subset_id": 0, "type":"open-ended", "metric":"RougeL"}
|
210 |
+
]
|
211 |
+
},
|
212 |
+
{
|
213 |
+
"client_id": 35,
|
214 |
+
"datasets":[
|
215 |
+
{"dataset": "AESOP","subset_id": 0, "type":"open-ended", "metric":"RougeL"}
|
216 |
+
]
|
217 |
+
},
|
218 |
+
{
|
219 |
+
"client_id": 36,
|
220 |
+
"datasets":[
|
221 |
+
{"dataset": "VISION","subset_id": 0, "type":"multi-choice"}
|
222 |
+
]
|
223 |
+
},
|
224 |
+
{
|
225 |
+
"client_id": 37,
|
226 |
+
"datasets":[
|
227 |
+
{"dataset": "VISION","subset_id": 1, "type":"multi-choice"}
|
228 |
+
]
|
229 |
+
},
|
230 |
+
{
|
231 |
+
"client_id": 38,
|
232 |
+
"datasets":[
|
233 |
+
{"dataset": "VizWiz","subset_id": 0, "type":"multi-choice"}
|
234 |
+
]
|
235 |
+
},
|
236 |
+
{
|
237 |
+
"client_id": 39,
|
238 |
+
"datasets":[
|
239 |
+
{"dataset": "MIT-States","subset_id": 0, "type":"multi-choice"}
|
240 |
+
]
|
241 |
+
}
|
242 |
+
]
|