mjleee committed on
Commit
0c0a4b5
·
verified ·
1 Parent(s): 6394d21

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. all_tasks.json +34 -0
  2. continuous/scenario-11.json +11 -0
  3. continuous/scenario-12.json +11 -0
  4. continuous/scenario-14.json +11 -0
  5. continuous/scenario-18.json +11 -0
  6. continuous/scenario-5.json +11 -0
  7. continuous/scenario-8.json +11 -0
  8. create_scenario.py +42 -0
  9. disjoint/scenario-1.json +8 -0
  10. disjoint/scenario-10.json +11 -0
  11. disjoint/scenario-102.json +8 -0
  12. disjoint/scenario-103.json +8 -0
  13. disjoint/scenario-104.json +8 -0
  14. disjoint/scenario-105.json +8 -0
  15. disjoint/scenario-106.json +8 -0
  16. disjoint/scenario-107.json +8 -0
  17. disjoint/scenario-11.json +11 -0
  18. disjoint/scenario-12.json +11 -0
  19. disjoint/scenario-14.json +11 -0
  20. disjoint/scenario-15.json +15 -0
  21. disjoint/scenario-16.json +11 -0
  22. disjoint/scenario-17.json +14 -0
  23. disjoint/scenario-18.json +11 -0
  24. disjoint/scenario-2.json +11 -0
  25. disjoint/scenario-20.json +11 -0
  26. disjoint/scenario-22.json +11 -0
  27. disjoint/scenario-28.json +11 -0
  28. disjoint/scenario-3.json +11 -0
  29. disjoint/scenario-32.json +11 -0
  30. disjoint/scenario-38.json +11 -0
  31. disjoint/scenario-4.json +11 -0
  32. disjoint/scenario-5.json +11 -0
  33. disjoint/scenario-6.json +8 -0
  34. disjoint/scenario-7.json +12 -0
  35. disjoint/scenario-8.json +11 -0
  36. disjoint/scenario-9.json +11 -0
  37. fcl_scenarios/scenario-0.json +92 -0
  38. fcl_scenarios/scenario-1.json +14 -0
  39. fcl_scenarios/scenario-10.json +26 -0
  40. fcl_scenarios/scenario-2.json +26 -0
  41. fcl_scenarios/scenario-20.json +92 -0
  42. fcl_scenarios/scenario-21.json +20 -0
  43. fcl_scenarios/scenario-22.json +38 -0
  44. fcl_scenarios/scenario-23.json +11 -0
  45. fcl_scenarios/scenario-24.json +20 -0
  46. fcl_scenarios/scenario-28.json +38 -0
  47. fcl_scenarios/scenario-29.json +38 -0
  48. fcl_scenarios/scenario-3.json +20 -0
  49. fcl_scenarios/scenario-4.json +14 -0
  50. fcl_scenarios/scenario-40.json +242 -0
all_tasks.json ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {"dataset": "AQUA","subset_id": 0, "task_name": "no external knowledge"},
3
+ {"dataset": "AQUA","subset_id": 1, "task_name": "need external knowledge 1"},
4
+ {"dataset": "AQUA","subset_id": 2, "task_name": "need external knowledge 2"},
5
+ {"dataset": "Mementos","subset_id": 0},
6
+ {"dataset": "SciCap","subset_id": 0, "task_name": "Yes-subfig"},
7
+ {"dataset": "SciCap","subset_id": 1, "task_name": "No-subfig"},
8
+ {"dataset": "Bongard-OpenWorld","subset_id": 0},
9
+ {"dataset": "HRVQA","subset_id": 0, "task_name": "areas"},
10
+ {"dataset": "HRVQA","subset_id": 1, "task_name": "color"},
11
+ {"dataset": "HRVQA","subset_id": 2, "task_name": "location"},
12
+ {"dataset": "HRVQA","subset_id": 3, "task_name": "numbers"},
13
+ {"dataset": "HRVQA","subset_id": 4, "task_name": "scene"},
14
+ {"dataset": "HRVQA","subset_id": 5, "task_name": "shape"},
15
+ {"dataset": "HRVQA","subset_id": 6, "task_name": "size"},
16
+ {"dataset": "HRVQA","subset_id": 7, "task_name": "sports"},
17
+ {"dataset": "HRVQA","subset_id": 8, "task_name": "transportation"},
18
+ {"dataset": "HRVQA","subset_id": 9, "task_name": "yes no"},
19
+ {"dataset": "mPLUG","subset_id": 0, "task_name": "areas"},
20
+ {"dataset": "mPLUG","subset_id": 1, "task_name": "color"},
21
+ {"dataset": "mPLUG","subset_id": 2, "task_name": "location"},
22
+ {"dataset": "mPLUG","subset_id": 3, "task_name": "numbers"},
23
+ {"dataset": "mPLUG","subset_id": 4, "task_name": "scene"},
24
+ {"dataset": "mPLUG","subset_id": 5, "task_name": "shape"},
25
+ {"dataset": "mPLUG","subset_id": 6, "task_name": "size"},
26
+ {"dataset": "mPLUG","subset_id": 7, "task_name": "sports"},
27
+ {"dataset": "Birds-to-Words","subset_id": 0},
28
+ {"dataset": "DiDeMoSV","subset_id": 0},
29
+ {"dataset": "VIST","subset_id": 0},
30
+ {"dataset": "Describe-Diff","subset_id": 0},
31
+ {"dataset": "NLVR2","subset_id": 0},
32
+ {"dataset": "NLVR2","subset_id": 1},
33
+ {"dataset": "KGQA","subset_id": 0}
34
+ ]
continuous/scenario-11.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "Bongard-HOI","subset_id": 150, "type":"multi-choice"},
6
+ {"dataset": "NLVR2","subset_id": 150, "type":"multi-choice"},
7
+ {"dataset": "Co-Instruct-DB","subset_id": 150, "type":"multi-choice"},
8
+ {"dataset": "TQA","subset_id": 150, "type":"multi-choice"}
9
+ ]
10
+ }
11
+ ]
continuous/scenario-12.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "NLVR2","subset_id": 151, "type":"multi-choice"},
6
+ {"dataset": "Bongard-HOI","subset_id": 151, "type":"multi-choice"},
7
+ {"dataset": "HQ_Edit","subset_id": 151, "type":"multi-choice"},
8
+ {"dataset": "PatternCom","subset_id": 151, "type":"multi-choice"}
9
+ ]
10
+ }
11
+ ]
continuous/scenario-14.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "Bongard-OpenWorld","subset_id": 153, "type":"multi-choice"},
6
+ {"dataset": "Co-Instruct-DB","subset_id": 153, "type":"multi-choice"},
7
+ {"dataset": "dvqa","subset_id": 153, "type":"multi-choice"},
8
+ {"dataset": "NLVR2","subset_id": 153, "type":"multi-choice"}
9
+ ]
10
+ }
11
+ ]
continuous/scenario-18.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "Bongard-OpenWorld","subset_id": 300, "type":"multi-choice"},
6
+ {"dataset": "Co-Instruct-DB","subset_id": 300, "type":"multi-choice"},
7
+ {"dataset": "dvqa","subset_id": 300, "type":"multi-choice"},
8
+ {"dataset": "HQ_Edit","subset_id": 300, "type":"multi-choice"}
9
+ ]
10
+ }
11
+ ]
continuous/scenario-5.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "Bongard-HOI","subset_id": 180, "type":"multi-choice"},
6
+ {"dataset": "Bongard-HOI","subset_id": 181, "type":"multi-choice"},
7
+ {"dataset": "Bongard-HOI","subset_id": 182, "type":"multi-choice"},
8
+ {"dataset": "Bongard-HOI","subset_id": 183, "type":"multi-choice"}
9
+ ]
10
+ }
11
+ ]
continuous/scenario-8.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "NLVR2","subset_id": 152, "type":"multi-choice"},
6
+ {"dataset": "HQ_Edit","subset_id": 152, "type":"multi-choice"},
7
+ {"dataset": "PatternCom","subset_id": 152, "type":"multi-choice"},
8
+ {"dataset": "Bongard-HOI","subset_id": 152, "type":"multi-choice"}
9
+ ]
10
+ }
11
+ ]
create_scenario.py ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
import random
import os
import argparse
import json


def _partition_tasks(task_list, client_num, tasks_per_client):
    """Give each client its own consecutive, non-overlapping slice of task_list."""
    return [
        {
            'client_id': client_id,
            'datasets': task_list[client_id * tasks_per_client:(client_id + 1) * tasks_per_client],
        }
        for client_id in range(client_num)
    ]


def main(argv=None):
    """Randomly split the tasks in ./all_tasks.json across clients and save the scenario.

    Reads the task list from ``./all_tasks.json`` (relative to the current
    working directory), shuffles it with the given seed, hands each client an
    equally sized, disjoint slice, and writes the result to
    ``scenario_{client_num}clients_{tasks}tasks_seed{seed}.json`` in the
    current working directory.

    Args:
        argv: Optional list of command-line tokens. ``None`` (the default)
            makes argparse read ``sys.argv[1:]``, as the script always did.

    Raises:
        SystemExit: via ``parser.error`` when ``--client_num`` is missing or
            not positive, when ``--max_task`` is not positive, or when there
            are fewer tasks than clients.
    """
    parser = argparse.ArgumentParser()

    # Command-line options: RNG seed, number of clients, per-client task cap.
    parser.add_argument('--seed', type=int, default=0, help='Random seed')
    # Required: without it args.client_num is None and the division below fails.
    parser.add_argument('--client_num', type=int, required=True, help='Number of client')
    parser.add_argument('--max_task', type=int, default=4, help='Maximum number of tasks per client')

    args = parser.parse_args(argv)

    # Reject values that would otherwise divide by zero or slice backwards.
    if args.client_num < 1:
        parser.error('--client_num must be a positive integer')
    if args.max_task < 1:
        parser.error('--max_task must be a positive integer')

    random.seed(args.seed)

    with open('./all_tasks.json', 'r') as fp:
        task_list = json.load(fp)

    print('total available tasks:', len(task_list))

    # Every client gets the same number of tasks, capped by --max_task and by
    # how many tasks exist once they are shared out evenly.
    max_task_per_client = min(args.max_task, len(task_list) // args.client_num)
    if max_task_per_client < 1:
        parser.error(
            f'not enough tasks: {len(task_list)} available for {args.client_num} clients'
        )

    random.shuffle(task_list)

    scenario_data = _partition_tasks(task_list, args.client_num, max_task_per_client)

    output_path = f'scenario_{args.client_num}clients_{max_task_per_client}tasks_seed{args.seed}.json'

    with open(output_path, 'w') as json_file:
        json.dump(scenario_data, json_file, indent=4)


if __name__ == "__main__":
    main()
disjoint/scenario-1.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "HRVQA","subset_id": 100, "type":"multi-choice"}
6
+ ]
7
+ }
8
+ ]
disjoint/scenario-10.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "Co-Instruct-DB","subset_id": 0, "type":"multi-choice"},
6
+ {"dataset": "Co-Instruct-DB","subset_id": 1, "type":"multi-choice"},
7
+ {"dataset": "Co-Instruct-DB","subset_id": 2, "type":"open-ended", "metric":"RougeL"},
8
+ {"dataset": "Co-Instruct-DB","subset_id": 3, "type":"open-ended", "metric":"RougeL"}
9
+ ]
10
+ }
11
+ ]
disjoint/scenario-102.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "DreamSim","subset_id": 0, "type":"multi-choice"}
6
+ ]
7
+ }
8
+ ]
disjoint/scenario-103.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "RecipeQA_TextCloze","subset_id": 0, "type":"multi-choice"}
6
+ ]
7
+ }
8
+ ]
disjoint/scenario-104.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "MagicBrush","subset_id": 0, "type":"multi-choice"}
6
+ ]
7
+ }
8
+ ]
disjoint/scenario-105.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "COMICS_Panel","subset_id": 0, "type":"multi-choice"}
6
+ ]
7
+ }
8
+ ]
disjoint/scenario-106.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "RecipeQA_ImageCoherence","subset_id": 0, "type":"multi-choice"}
6
+ ]
7
+ }
8
+ ]
disjoint/scenario-107.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "Mantis_contrastive_caption","subset_id": 0, "type":"multi-choice"}
6
+ ]
7
+ }
8
+ ]
disjoint/scenario-11.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "Bongard-HOI","subset_id": 50, "type":"multi-choice"},
6
+ {"dataset": "NLVR2","subset_id": 0, "type":"multi-choice"},
7
+ {"dataset": "Co-Instruct-DB","subset_id": 0, "type":"multi-choice"},
8
+ {"dataset": "TQA","subset_id": 0, "type":"multi-choice"}
9
+ ]
10
+ }
11
+ ]
disjoint/scenario-12.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "NLVR2-2","subset_id": 0, "type":"multi-choice"},
6
+ {"dataset": "Bongard-HOI2","subset_id": 50, "type":"multi-choice"},
7
+ {"dataset": "HQ_Edit-2","subset_id": 0, "type":"multi-choice"},
8
+ {"dataset": "PatternCom-2","subset_id": 0, "type":"multi-choice"}
9
+ ]
10
+ }
11
+ ]
disjoint/scenario-14.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "Bongard-OpenWorld","subset_id": 1, "type":"multi-choice"},
6
+ {"dataset": "Co-Instruct-DB","subset_id": 0, "type":"multi-choice"},
7
+ {"dataset": "dvqa","subset_id": 0, "type":"multi-choice"},
8
+ {"dataset": "NLVR2","subset_id": 0, "type":"multi-choice"}
9
+ ]
10
+ }
11
+ ]
disjoint/scenario-15.json ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "ScienceQA","subset_id": 4, "type":"onlyLang"},
6
+ {"dataset": "TextVQA","subset_id": 6, "type":"ocr"},
7
+ {"dataset": "ImageNet","subset_id": 4, "type":"classification"},
8
+ {"dataset": "GQA","subset_id": 4, "type":"truth-alignment"},
9
+ {"dataset": "VizWiz2","subset_id": 4, "type":"truth-alignment"},
10
+ {"dataset": "COCO2014","subset_id": 4, "type":"grounding"},
11
+ {"dataset": "COCO2014","subset_id": 5, "type":"truth-alignment"},
12
+ {"dataset": "OCR-VQA","subset_id": 4, "type":"truth-alignment"}
13
+ ]
14
+ }
15
+ ]
disjoint/scenario-16.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "M3IT","subset_id": 3, "type":"open-ended", "metric":"accuracy"},
6
+ {"dataset": "MANTIS","subset_id": 2, "type":"open-ended", "metric":"accuracy"},
7
+ {"dataset": "LaMM","subset_id": 2, "type":"open-ended", "metric":"accuracy"},
8
+ {"dataset": "VisionFLAN","subset_id": 2, "type":"open-ended", "metric":"accuracy"}
9
+ ]
10
+ }
11
+ ]
disjoint/scenario-17.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "Bongard-OpenWorld","subset_id": 99, "type":"multi-choice"},
6
+ {"dataset": "NLVR2-2","subset_id": 99, "type":"multi-choice"},
7
+ {"dataset": "Co-Instruct-DB2","subset_id": 99, "type":"multi-choice"},
8
+ {"dataset": "Bongard-HOI","subset_id": 99, "type":"multi-choice"},
9
+ {"dataset": "PatternCom-2","subset_id": 99, "type":"multi-choice"},
10
+ {"dataset": "dvqa2","subset_id": 99, "type":"multi-choice"},
11
+ {"dataset": "HQ_Edit2","subset_id": 99, "type":"multi-choice"}
12
+ ]
13
+ }
14
+ ]
disjoint/scenario-18.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "Bongard-OpenWorld","subset_id": 3, "type":"multi-choice"},
6
+ {"dataset": "Co-Instruct-DB","subset_id": 0, "type":"multi-choice"},
7
+ {"dataset": "dvqa","subset_id": 0, "type":"multi-choice"},
8
+ {"dataset": "HQ_Edit","subset_id": 0, "type":"multi-choice"}
9
+ ]
10
+ }
11
+ ]
disjoint/scenario-2.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "HRVQA","subset_id": 1, "type":"multi-choice"},
6
+ {"dataset": "Bongard-HOI","subset_id": 1, "type":"multi-choice"},
7
+ {"dataset": "mPLUG","subset_id": 0, "type":"open-ended"},
8
+ {"dataset": "NLVR2","subset_id": 0,"type":"multi-choice"}
9
+ ]
10
+ }
11
+ ]
disjoint/scenario-20.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "ChartQA2","subset_id": 0, "type":"open-ended", "metric":"accuracy"},
6
+ {"dataset": "DocVQA2","subset_id": 0, "type":"open-ended", "metric":"accuracy"},
7
+ {"dataset": "iconqa2","subset_id": 0, "type":"open-ended", "metric":"accuracy"},
8
+ {"dataset": "PathVQA2","subset_id": 0, "type":"open-ended", "metric":"accuracy"}
9
+ ]
10
+ }
11
+ ]
disjoint/scenario-22.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "PatternCom-2","subset_id": 0, "type":"multi-choice"},
6
+ {"dataset": "NLVR2-2","subset_id": 0, "type":"multi-choice"},
7
+ {"dataset": "HQ_Edit-2","subset_id": 0, "type":"multi-choice"},
8
+ {"dataset": "Bongard-HOI2","subset_id": 50, "type":"multi-choice"}
9
+ ]
10
+ }
11
+ ]
disjoint/scenario-28.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "HQ_Edit","subset_id": 0, "type":"multi-choice"},
6
+ {"dataset": "Bongard-OpenWorld","subset_id": 3, "type":"multi-choice"},
7
+ {"dataset": "dvqa","subset_id": 0, "type":"multi-choice"},
8
+ {"dataset": "Co-Instruct-DB","subset_id": 0, "type":"multi-choice"}
9
+ ]
10
+ }
11
+ ]
disjoint/scenario-3.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "HRVQA","subset_id": 1, "type":"multi-choice"},
6
+ {"dataset": "HRVQA","subset_id": 5, "type":"multi-choice"},
7
+ {"dataset": "HRVQA","subset_id": 6, "type":"multi-choice"},
8
+ {"dataset": "HRVQA","subset_id": 9, "type":"multi-choice"}
9
+ ]
10
+ }
11
+ ]
disjoint/scenario-32.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "HQ_Edit-2","subset_id": 0, "type":"multi-choice"},
6
+ {"dataset": "PatternCom-2","subset_id": 0, "type":"multi-choice"},
7
+ {"dataset": "Bongard-HOI2","subset_id": 50, "type":"multi-choice"},
8
+ {"dataset": "NLVR2-2","subset_id": 0, "type":"multi-choice"}
9
+ ]
10
+ }
11
+ ]
disjoint/scenario-38.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "dvqa","subset_id": 0, "type":"multi-choice"},
6
+ {"dataset": "HQ_Edit","subset_id": 0, "type":"multi-choice"},
7
+ {"dataset": "Bongard-OpenWorld","subset_id": 3, "type":"multi-choice"},
8
+ {"dataset": "Co-Instruct-DB","subset_id": 0, "type":"multi-choice"}
9
+ ]
10
+ }
11
+ ]
disjoint/scenario-4.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "HRVQA","subset_id": 100, "type":"multi-choice"},
6
+ {"dataset": "Bongard-HOI","subset_id": 100, "type":"multi-choice"},
7
+ {"dataset": "mPLUG","subset_id": 100, "type":"open-ended"},
8
+ {"dataset": "NLVR2","subset_id": 100,"type":"multi-choice"}
9
+ ]
10
+ }
11
+ ]
disjoint/scenario-5.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "Bongard-HOI","subset_id": 50, "type":"multi-choice"},
6
+ {"dataset": "Bongard-HOI","subset_id": 51, "type":"multi-choice"},
7
+ {"dataset": "Bongard-HOI","subset_id": 52, "type":"multi-choice"},
8
+ {"dataset": "Bongard-HOI","subset_id": 53, "type":"multi-choice"}
9
+ ]
10
+ }
11
+ ]
disjoint/scenario-6.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "Bongard-HOI","subset_id": 90, "type":"multi-choice"}
6
+ ]
7
+ }
8
+ ]
disjoint/scenario-7.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "WebQA","subset_id": 0, "type":"multi-choice"},
6
+ {"dataset": "AQUA","subset_id": 0, "type":"multi-choice"},
7
+ {"dataset": "TQA","subset_id": 0, "type":"multi-choice"},
8
+ {"dataset": "dvqa","subset_id": 0, "type":"multi-choice"}
9
+
10
+ ]
11
+ }
12
+ ]
disjoint/scenario-8.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "NLVR2","subset_id": 0, "type":"multi-choice"},
6
+ {"dataset": "HQ_Edit","subset_id": 0, "type":"multi-choice"},
7
+ {"dataset": "PatternCom","subset_id": 0, "type":"multi-choice"},
8
+ {"dataset": "Bongard-HOI","subset_id": 2, "type":"multi-choice"}
9
+ ]
10
+ }
11
+ ]
disjoint/scenario-9.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "dvqa","subset_id": 0, "type":"multi-choice"},
6
+ {"dataset": "HQ_Edit","subset_id": 0, "type":"multi-choice"},
7
+ {"dataset": "TQA","subset_id": 0, "type":"multi-choice"},
8
+ {"dataset": "PatternCom","subset_id": 0, "type":"multi-choice"}
9
+ ]
10
+ }
11
+ ]
fcl_scenarios/scenario-0.json ADDED
@@ -0,0 +1,92 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "Fashion200K","subset_id": 0, "type":"multi-choice"},
6
+ {"dataset": "Fashion200K","subset_id": 2, "type":"multi-choice"},
7
+ {"dataset": "Fashion200K","subset_id": 3, "type":"multi-choice"},
8
+ {"dataset": "FashionIQ","subset_id": 0, "type":"multi-choice"}
9
+ ]
10
+ },
11
+ {
12
+ "client_id": 1,
13
+ "datasets":[
14
+ {"dataset": "HRVQA","subset_id": 2, "type":"multi-choice"},
15
+ {"dataset": "HRVQA","subset_id": 5, "type":"multi-choice"},
16
+ {"dataset": "HRVQA","subset_id": 7, "type":"multi-choice"},
17
+ {"dataset": "HRVQA","subset_id": 9, "type":"multi-choice"}
18
+ ]
19
+ },
20
+ {
21
+ "client_id": 2,
22
+ "datasets":[
23
+ {"dataset": "NLVR2","subset_id": 0,"type":"multi-choice"},
24
+ {"dataset": "CIRR","subset_id": 1,"type":"multi-choice"},
25
+ {"dataset": "HQ_Edit","subset_id": 0,"type":"multi-choice"},
26
+ {"dataset": "PatternCom","subset_id": 0,"type":"multi-choice"}
27
+ ]
28
+ },
29
+ {
30
+ "client_id": 3,
31
+ "datasets":[
32
+ {"dataset": "WebQA","subset_id": 0, "type":"open-ended", "metric":"F1"},
33
+ {"dataset": "TQA","subset_id": 0, "type":"multi-choice"},
34
+ {"dataset": "AQUA","subset_id": 0, "type":"open-ended", "metric":"F1"},
35
+ {"dataset": "dvqa","subset_id": 0, "type":"multi-choice"}
36
+ ]
37
+ },
38
+ {
39
+ "client_id": 4,
40
+ "datasets":[
41
+ {"dataset": "Bongard-OpenWorld","subset_id": 3, "type":"multi-choice"},
42
+ {"dataset": "Bongard-OpenWorld","subset_id": 1, "type":"multi-choice"},
43
+ {"dataset": "Bongard-HOI","subset_id": 0, "type":"multi-choice"},
44
+ {"dataset": "Bongard-HOI","subset_id": 1, "type":"multi-choice"}
45
+ ]
46
+ },
47
+ {
48
+ "client_id": 5,
49
+ "datasets":[
50
+ {"dataset": "iconqa","subset_id": 0, "type":"multi-choice"},
51
+ {"dataset": "iconqa","subset_id": 1, "type":"multi-choice"},
52
+ {"dataset": "iconqa","subset_id": 2, "type":"open-ended", "metric":"F1"},
53
+ {"dataset": "iconqa","subset_id": 3, "type":"open-ended", "metric":"F1"}
54
+ ]
55
+ },
56
+ {
57
+ "client_id": 6,
58
+ "datasets":[
59
+ {"dataset": "Co-Instruct-DB","subset_id": 0, "type":"multi-choice"},
60
+ {"dataset": "Co-Instruct-DB","subset_id": 1, "type":"multi-choice"},
61
+ {"dataset": "Co-Instruct-DB","subset_id": 2, "type":"open-ended", "metric":"RougeL"},
62
+ {"dataset": "Co-Instruct-DB","subset_id": 3, "type":"open-ended", "metric":"RougeL"}
63
+ ]
64
+ },
65
+ {
66
+ "client_id": 7,
67
+ "datasets":[
68
+ {"dataset": "Spot-the-Diff","subset_id": 0, "type":"open-ended", "metric":"RougeL"},
69
+ {"dataset": "Birds-to-Words","subset_id": 0, "type":"open-ended", "metric":"RougeL"},
70
+ {"dataset": "IEdit","subset_id": 0, "type":"open-ended", "metric":"RougeL"},
71
+ {"dataset": "CLEVR-Change","subset_id": 0, "type":"open-ended", "metric":"RougeL"}
72
+ ]
73
+ },
74
+ {
75
+ "client_id": 8,
76
+ "datasets":[
77
+ {"dataset": "PororoSV","subset_id": 0, "type":"open-ended", "metric":"RougeL"},
78
+ {"dataset": "FlintstonesSV","subset_id": 0, "type":"open-ended", "metric":"RougeL"},
79
+ {"dataset": "VIST","subset_id": 0, "type":"open-ended", "metric":"RougeL"},
80
+ {"dataset": "AESOP","subset_id": 0, "type":"open-ended", "metric":"RougeL"}
81
+ ]
82
+ },
83
+ {
84
+ "client_id": 9,
85
+ "datasets":[
86
+ {"dataset": "VISION","subset_id": 0, "type":"multi-choice"},
87
+ {"dataset": "VISION","subset_id": 1, "type":"multi-choice"},
88
+ {"dataset": "VizWiz","subset_id": 0, "type":"multi-choice"},
89
+ {"dataset": "MIT-States","subset_id": 0, "type":"multi-choice"}
90
+ ]
91
+ }
92
+ ]
fcl_scenarios/scenario-1.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "HRVQA","subset_id": 1, "type":"multi-choice"},
6
+ {"dataset": "HRVQA","subset_id": 6, "type":"multi-choice"},
7
+ {"dataset": "iconqa","subset_id": 4, "type":"multi-choice"},
8
+ {"dataset": "ALFRED","subset_id": 0, "type":"open-ended", "metric":"RougeL"},
9
+ {"dataset": "DiDeMoSV","subset_id": 0, "type":"open-ended", "metric":"RougeL"},
10
+ {"dataset": "COMICS_Dialogue","subset_id": 0, "type":"multi-choice"},
11
+ {"dataset": "RecipeQA_ImageCoherence","subset_id": 0,"type":"multi-choice"}
12
+ ]
13
+ }
14
+ ]
fcl_scenarios/scenario-10.json ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "DreamSim","subset_id": 0,"type":"multi-choice"}
6
+ ]
7
+ },
8
+ {
9
+ "client_id": 1,
10
+ "datasets":[
11
+ {"dataset": "Mementos","subset_id": 0, "type":"open-ended", "metric":"RougeL"}
12
+ ]
13
+ },
14
+ {
15
+ "client_id": 2,
16
+ "datasets":[
17
+ {"dataset": "Bongard-HOI","subset_id": 2, "type":"multi-choice"}
18
+ ]
19
+ },
20
+ {
21
+ "client_id": 3,
22
+ "datasets":[
23
+ {"dataset": "Co-Instruct-DB","subset_id": 8, "type":"multi-choice"}
24
+ ]
25
+ }
26
+ ]
fcl_scenarios/scenario-2.json ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "ALFRED","subset_id": 0, "type":"open-ended", "metric":"RougeL"}
6
+ ]
7
+ },
8
+ {
9
+ "client_id": 1,
10
+ "datasets":[
11
+ {"dataset": "DiDeMoSV","subset_id": 0, "type":"open-ended", "metric":"RougeL"}
12
+ ]
13
+ },
14
+ {
15
+ "client_id": 2,
16
+ "datasets":[
17
+ {"dataset": "COMICS_Dialogue","subset_id": 0, "type":"multi-choice"}
18
+ ]
19
+ },
20
+ {
21
+ "client_id": 3,
22
+ "datasets":[
23
+ {"dataset": "RecipeQA_ImageCoherence","subset_id": 0,"type":"multi-choice"}
24
+ ]
25
+ }
26
+ ]
fcl_scenarios/scenario-20.json ADDED
@@ -0,0 +1,92 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "RecipeQA_TextCloze","subset_id": 0, "type":"multi-choice"},
6
+ {"dataset": "RecipeQA_VisualCloze","subset_id": 0, "type":"multi-choice"},
7
+ {"dataset": "COMICS_Dialogue","subset_id": 0, "type":"multi-choice"},
8
+ {"dataset": "COMICS_Panel","subset_id": 0, "type":"multi-choice"}
9
+ ]
10
+ },
11
+ {
12
+ "client_id": 1,
13
+ "datasets":[
14
+ {"dataset": "HRVQA","subset_id": 1, "type":"multi-choice"},
15
+ {"dataset": "HRVQA","subset_id": 5, "type":"multi-choice"},
16
+ {"dataset": "HRVQA","subset_id": 6, "type":"multi-choice"},
17
+ {"dataset": "HRVQA","subset_id": 9, "type":"multi-choice"}
18
+ ]
19
+ },
20
+ {
21
+ "client_id": 2,
22
+ "datasets":[
23
+ {"dataset": "Fashion200K","subset_id": 0,"type":"multi-choice"},
24
+ {"dataset": "Fashion200K","subset_id": 1,"type":"multi-choice"},
25
+ {"dataset": "RecipeQA_ImageCoherence","subset_id": 0,"type":"multi-choice"},
26
+ {"dataset": "NLVR2","subset_id": 0,"type":"multi-choice"}
27
+ ]
28
+ },
29
+ {
30
+ "client_id": 3,
31
+ "datasets":[
32
+ {"dataset": "WebQA","subset_id": 0, "type":"open-ended"},
33
+ {"dataset": "TQA","subset_id": 0, "type":"multi-choice"},
34
+ {"dataset": "AQUA","subset_id": 0, "type":"open-ended"},
35
+ {"dataset": "AQUA","subset_id": 1, "type":"open-ended"}
36
+ ]
37
+ },
38
+ {
39
+ "client_id": 4,
40
+ "datasets":[
41
+ {"dataset": "Bongard-OpenWorld","subset_id": 0, "type":"open-ended"},
42
+ {"dataset": "Bongard-OpenWorld","subset_id": 1, "type":"multi-choice"},
43
+ {"dataset": "Bongard-HOI","subset_id": 0, "type":"multi-choice"},
44
+ {"dataset": "Bongard-HOI","subset_id": 1, "type":"multi-choice"}
45
+ ]
46
+ },
47
+ {
48
+ "client_id": 5,
49
+ "datasets":[
50
+ {"dataset": "HRVQA","subset_id": 2, "type":"multi-choice"},
51
+ {"dataset": "HRVQA","subset_id": 4, "type":"multi-choice"},
52
+ {"dataset": "HRVQA","subset_id": 7, "type":"multi-choice"},
53
+ {"dataset": "HRVQA","subset_id": 8, "type":"multi-choice"}
54
+ ]
55
+ },
56
+ {
57
+ "client_id": 6,
58
+ "datasets":[
59
+ {"dataset": "mPLUG","subset_id": 0, "type":"open-ended"},
60
+ {"dataset": "mPLUG","subset_id": 1, "type":"open-ended"},
61
+ {"dataset": "mPLUG","subset_id": 2, "type":"open-ended"},
62
+ {"dataset": "mPLUG","subset_id": 4, "type":"open-ended"}
63
+ ]
64
+ },
65
+ {
66
+ "client_id": 7,
67
+ "datasets":[
68
+ {"dataset": "Spot-the-Diff","subset_id": 0, "type":"open-ended"},
69
+ {"dataset": "Birds-to-Words","subset_id": 0, "type":"open-ended"},
70
+ {"dataset": "IEdit","subset_id": 0, "type":"open-ended"},
71
+ {"dataset": "CLEVR-Change","subset_id": 0, "type":"open-ended"}
72
+ ]
73
+ },
74
+ {
75
+ "client_id": 8,
76
+ "datasets":[
77
+ {"dataset": "PororoSV","subset_id": 0, "type":"open-ended"},
78
+ {"dataset": "FlintstonesSV","subset_id": 0, "type":"open-ended"},
79
+ {"dataset": "VIST","subset_id": 0, "type":"open-ended"},
80
+ {"dataset": "AESOP","subset_id": 0, "type":"open-ended"}
81
+ ]
82
+ },
83
+ {
84
+ "client_id": 9,
85
+ "datasets":[
86
+ {"dataset": "VISION","subset_id": 0, "type":"multi-choice"},
87
+ {"dataset": "VISION","subset_id": 1, "type":"multi-choice"},
88
+ {"dataset": "VizWiz","subset_id": 0, "type":"multi-choice"},
89
+ {"dataset": "MIT-States","subset_id": 0, "type":"multi-choice"}
90
+ ]
91
+ }
92
+ ]
fcl_scenarios/scenario-21.json ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "Fashion200K","subset_id": 0,"type":"multi-choice"},
6
+ {"dataset": "Fashion200K","subset_id": 1,"type":"multi-choice"},
7
+ {"dataset": "RecipeQA_ImageCoherence","subset_id": 0,"type":"multi-choice"},
8
+ {"dataset": "NLVR2","subset_id": 0,"type":"multi-choice"}
9
+ ]
10
+ },
11
+ {
12
+ "client_id": 1,
13
+ "datasets":[
14
+ {"dataset": "VISION","subset_id": 0, "type":"multi-choice"},
15
+ {"dataset": "VISION","subset_id": 1, "type":"multi-choice"},
16
+ {"dataset": "VizWiz","subset_id": 0, "type":"multi-choice"},
17
+ {"dataset": "MIT-States","subset_id": 0, "type":"multi-choice"}
18
+ ]
19
+ }
20
+ ]
fcl_scenarios/scenario-22.json ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "RecipeQA_TextCloze","subset_id": 0, "type":"multi-choice"},
6
+ {"dataset": "RecipeQA_VisualCloze","subset_id": 0, "type":"multi-choice"},
7
+ {"dataset": "COMICS_Dialogue","subset_id": 0, "type":"multi-choice"},
8
+ {"dataset": "COMICS_Panel","subset_id": 0, "type":"multi-choice"}
9
+ ]
10
+ },
11
+ {
12
+ "client_id": 1,
13
+ "datasets":[
14
+ {"dataset": "Fashion200K","subset_id": 0,"type":"multi-choice"},
15
+ {"dataset": "Fashion200K","subset_id": 1,"type":"multi-choice"},
16
+ {"dataset": "RecipeQA_ImageCoherence","subset_id": 0,"type":"multi-choice"},
17
+ {"dataset": "NLVR2","subset_id": 0,"type":"multi-choice"}
18
+ ]
19
+ },
20
+ {
21
+ "client_id": 2,
22
+ "datasets":[
23
+ {"dataset": "Bongard-OpenWorld","subset_id": 0, "type":"open-ended"},
24
+ {"dataset": "Bongard-OpenWorld","subset_id": 1, "type":"multi-choice"},
25
+ {"dataset": "Bongard-HOI","subset_id": 0, "type":"multi-choice"},
26
+ {"dataset": "Bongard-HOI","subset_id": 1, "type":"multi-choice"}
27
+ ]
28
+ },
29
+ {
30
+ "client_id": 3,
31
+ "datasets":[
32
+ {"dataset": "VISION","subset_id": 0, "type":"multi-choice"},
33
+ {"dataset": "VISION","subset_id": 1, "type":"multi-choice"},
34
+ {"dataset": "VizWiz","subset_id": 0, "type":"multi-choice"},
35
+ {"dataset": "MIT-States","subset_id": 0, "type":"multi-choice"}
36
+ ]
37
+ }
38
+ ]
fcl_scenarios/scenario-23.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "RecipeQA_TextCloze","subset_id": 0, "type":"multi-choice"},
6
+ {"dataset": "RecipeQA_VisualCloze","subset_id": 0, "type":"multi-choice"},
7
+ {"dataset": "COMICS_Dialogue","subset_id": 0, "type":"multi-choice"},
8
+ {"dataset": "COMICS_Panel","subset_id": 0, "type":"multi-choice"}
9
+ ]
10
+ }
11
+ ]
fcl_scenarios/scenario-24.json ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "Fashion200K","subset_id": 0,"type":"multi-choice"},
6
+ {"dataset": "Fashion200K","subset_id": 1,"type":"multi-choice"},
7
+ {"dataset": "RecipeQA_ImageCoherence","subset_id": 0,"type":"multi-choice"},
8
+ {"dataset": "NLVR2","subset_id": 0,"type":"multi-choice"}
9
+ ]
10
+ },
11
+ {
12
+ "client_id": 1,
13
+ "datasets":[
14
+ {"dataset": "VISION","subset_id": 0, "type":"multi-choice"},
15
+ {"dataset": "VISION","subset_id": 1, "type":"multi-choice"},
16
+ {"dataset": "VizWiz","subset_id": 0, "type":"multi-choice"},
17
+ {"dataset": "MIT-States","subset_id": 0, "type":"multi-choice"}
18
+ ]
19
+ }
20
+ ]
fcl_scenarios/scenario-28.json ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "HRVQA","subset_id": 1, "type":"multi-choice"},
6
+ {"dataset": "HRVQA","subset_id": 5, "type":"multi-choice"},
7
+ {"dataset": "HRVQA","subset_id": 6, "type":"multi-choice"},
8
+ {"dataset": "HRVQA","subset_id": 9, "type":"multi-choice"}
9
+ ]
10
+ },
11
+ {
12
+ "client_id": 1,
13
+ "datasets":[
14
+ {"dataset": "WebQA","subset_id": 0, "type":"open-ended"},
15
+ {"dataset": "TQA","subset_id": 0, "type":"multi-choice"},
16
+ {"dataset": "AQUA","subset_id": 0, "type":"open-ended"},
17
+ {"dataset": "AQUA","subset_id": 1, "type":"open-ended"}
18
+ ]
19
+ },
20
+ {
21
+ "client_id": 2,
22
+ "datasets":[
23
+ {"dataset": "Spot-the-Diff","subset_id": 0, "type":"open-ended"},
24
+ {"dataset": "Birds-to-Words","subset_id": 0, "type":"open-ended"},
25
+ {"dataset": "IEdit","subset_id": 0, "type":"open-ended"},
26
+ {"dataset": "CLEVR-Change","subset_id": 0, "type":"open-ended"}
27
+ ]
28
+ },
29
+ {
30
+ "client_id": 3,
31
+ "datasets":[
32
+ {"dataset": "VISION","subset_id": 0, "type":"multi-choice"},
33
+ {"dataset": "VISION","subset_id": 1, "type":"multi-choice"},
34
+ {"dataset": "VizWiz","subset_id": 0, "type":"multi-choice"},
35
+ {"dataset": "MIT-States","subset_id": 0, "type":"multi-choice"}
36
+ ]
37
+ }
38
+ ]
fcl_scenarios/scenario-29.json ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "RecipeQA_TextCloze","subset_id": 0, "type":"multi-choice"},
6
+ {"dataset": "RecipeQA_VisualCloze","subset_id": 0, "type":"multi-choice"},
7
+ {"dataset": "COMICS_Dialogue","subset_id": 0, "type":"multi-choice"},
8
+ {"dataset": "COMICS_Panel","subset_id": 0, "type":"multi-choice"}
9
+ ]
10
+ },
11
+ {
12
+ "client_id": 1,
13
+ "datasets":[
14
+ {"dataset": "HRVQA","subset_id": 1, "type":"multi-choice"},
15
+ {"dataset": "HRVQA","subset_id": 5, "type":"multi-choice"},
16
+ {"dataset": "HRVQA","subset_id": 6, "type":"multi-choice"},
17
+ {"dataset": "HRVQA","subset_id": 9, "type":"multi-choice"}
18
+ ]
19
+ },
20
+ {
21
+ "client_id": 2,
22
+ "datasets":[
23
+ {"dataset": "Bongard-OpenWorld","subset_id": 0, "type":"open-ended"},
24
+ {"dataset": "Bongard-OpenWorld","subset_id": 1, "type":"multi-choice"},
25
+ {"dataset": "Bongard-HOI","subset_id": 0, "type":"multi-choice"},
26
+ {"dataset": "Bongard-HOI","subset_id": 1, "type":"multi-choice"}
27
+ ]
28
+ },
29
+ {
30
+ "client_id": 3,
31
+ "datasets":[
32
+ {"dataset": "PororoSV","subset_id": 0, "type":"open-ended"},
33
+ {"dataset": "FlintstonesSV","subset_id": 0, "type":"open-ended"},
34
+ {"dataset": "VIST","subset_id": 0, "type":"open-ended"},
35
+ {"dataset": "AESOP","subset_id": 0, "type":"open-ended"}
36
+ ]
37
+ }
38
+ ]
fcl_scenarios/scenario-3.json ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "mPLUG","subset_id": 0, "type":"open-ended", "metric":"RougeL"}
6
+ ]
7
+ },
8
+ {
9
+ "client_id": 1,
10
+ "datasets":[
11
+ {"dataset": "iconqa","subset_id": 4, "type":"multi-choice"}
12
+ ]
13
+ },
14
+ {
15
+ "client_id": 2,
16
+ "datasets":[
17
+ {"dataset": "RecipeQA_TextCloze","subset_id": 0, "type":"multi-choice"}
18
+ ]
19
+ }
20
+ ]
fcl_scenarios/scenario-4.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "mPLUG","subset_id": 0, "type":"open-ended", "metric":"RougeL"}
6
+ ]
7
+ },
8
+ {
9
+ "client_id": 1,
10
+ "datasets":[
11
+ {"dataset": "iconqa","subset_id": 4, "type":"multi-choice"}
12
+ ]
13
+ }
14
+ ]
fcl_scenarios/scenario-40.json ADDED
@@ -0,0 +1,242 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "client_id": 0,
4
+ "datasets":[
5
+ {"dataset": "Fashion200K","subset_id": 0, "type":"multi-choice"}
6
+ ]
7
+ },
8
+ {
9
+ "client_id": 1,
10
+ "datasets":[
11
+ {"dataset": "Fashion200K","subset_id": 2, "type":"multi-choice"}
12
+ ]
13
+ },
14
+ {
15
+ "client_id": 2,
16
+ "datasets":[
17
+ {"dataset": "Fashion200K","subset_id": 3, "type":"multi-choice"}
18
+ ]
19
+ },
20
+ {
21
+ "client_id": 3,
22
+ "datasets":[
23
+ {"dataset": "FashionIQ","subset_id": 0, "type":"multi-choice"}
24
+ ]
25
+ },
26
+ {
27
+ "client_id": 4,
28
+ "datasets":[
29
+ {"dataset": "HRVQA","subset_id": 2, "type":"multi-choice"}
30
+ ]
31
+ },
32
+ {
33
+ "client_id": 5,
34
+ "datasets":[
35
+ {"dataset": "HRVQA","subset_id": 5, "type":"multi-choice"}
36
+ ]
37
+ },
38
+ {
39
+ "client_id": 6,
40
+ "datasets":[
41
+ {"dataset": "HRVQA","subset_id": 7, "type":"multi-choice"}
42
+ ]
43
+ },
44
+ {
45
+ "client_id": 7,
46
+ "datasets":[
47
+ {"dataset": "HRVQA","subset_id": 9, "type":"multi-choice"}
48
+ ]
49
+ },
50
+ {
51
+ "client_id": 8,
52
+ "datasets":[
53
+ {"dataset": "NLVR2","subset_id": 0,"type":"multi-choice"}
54
+ ]
55
+ },
56
+ {
57
+ "client_id": 9,
58
+ "datasets":[
59
+ {"dataset": "CIRR","subset_id": 1,"type":"multi-choice"}
60
+ ]
61
+ },
62
+ {
63
+ "client_id": 10,
64
+ "datasets":[
65
+ {"dataset": "HQ_Edit","subset_id": 0,"type":"multi-choice"}
66
+ ]
67
+ },
68
+ {
69
+ "client_id": 11,
70
+ "datasets":[
71
+ {"dataset": "PatternCom","subset_id": 0,"type":"multi-choice"}
72
+ ]
73
+ },
74
+ {
75
+ "client_id": 12,
76
+ "datasets":[
77
+ {"dataset": "WebQA","subset_id": 0, "type":"open-ended", "metric":"F1"}
78
+ ]
79
+ },
80
+ {
81
+ "client_id": 13,
82
+ "datasets":[
83
+ {"dataset": "TQA","subset_id": 0, "type":"multi-choice"}
84
+ ]
85
+ },
86
+ {
87
+ "client_id": 14,
88
+ "datasets":[
89
+ {"dataset": "AQUA","subset_id": 0, "type":"open-ended", "metric":"F1"}
90
+ ]
91
+ },
92
+ {
93
+ "client_id": 15,
94
+ "datasets":[
95
+ {"dataset": "dvqa","subset_id": 0, "type":"multi-choice"}
96
+ ]
97
+ },
98
+ {
99
+ "client_id": 16,
100
+ "datasets":[
101
+ {"dataset": "Bongard-OpenWorld","subset_id": 3, "type":"multi-choice"}
102
+ ]
103
+ },
104
+ {
105
+ "client_id": 17,
106
+ "datasets":[
107
+ {"dataset": "Bongard-OpenWorld","subset_id": 1, "type":"multi-choice"}
108
+ ]
109
+ },
110
+ {
111
+ "client_id": 18,
112
+ "datasets":[
113
+ {"dataset": "Bongard-HOI","subset_id": 0, "type":"multi-choice"}
114
+ ]
115
+ },
116
+ {
117
+ "client_id": 19,
118
+ "datasets":[
119
+ {"dataset": "Bongard-HOI","subset_id": 1, "type":"multi-choice"}
120
+ ]
121
+ },
122
+ {
123
+ "client_id": 20,
124
+ "datasets":[
125
+ {"dataset": "iconqa","subset_id": 0, "type":"multi-choice"}
126
+ ]
127
+ },
128
+ {
129
+ "client_id": 21,
130
+ "datasets":[
131
+ {"dataset": "iconqa","subset_id": 1, "type":"multi-choice"}
132
+ ]
133
+ },
134
+ {
135
+ "client_id": 22,
136
+ "datasets":[
137
+ {"dataset": "iconqa","subset_id": 2, "type":"open-ended", "metric":"F1"}
138
+ ]
139
+ },
140
+ {
141
+ "client_id": 23,
142
+ "datasets":[
143
+ {"dataset": "iconqa","subset_id": 3, "type":"open-ended", "metric":"F1"}
144
+ ]
145
+ },
146
+ {
147
+ "client_id": 24,
148
+ "datasets":[
149
+ {"dataset": "Co-Instruct-DB","subset_id": 0, "type":"multi-choice"}
150
+ ]
151
+ },
152
+ {
153
+ "client_id": 25,
154
+ "datasets":[
155
+ {"dataset": "Co-Instruct-DB","subset_id": 1, "type":"multi-choice"}
156
+ ]
157
+ },
158
+ {
159
+ "client_id": 26,
160
+ "datasets":[
161
+ {"dataset": "Co-Instruct-DB","subset_id": 2, "type":"open-ended", "metric":"RougeL"}
162
+ ]
163
+ },
164
+ {
165
+ "client_id": 27,
166
+ "datasets":[
167
+ {"dataset": "Co-Instruct-DB","subset_id": 3, "type":"open-ended", "metric":"RougeL"}
168
+ ]
169
+ },
170
+ {
171
+ "client_id": 28,
172
+ "datasets":[
173
+ {"dataset": "Spot-the-Diff","subset_id": 0, "type":"open-ended", "metric":"RougeL"}
174
+ ]
175
+ },
176
+ {
177
+ "client_id": 29,
178
+ "datasets":[
179
+ {"dataset": "Birds-to-Words","subset_id": 0, "type":"open-ended", "metric":"RougeL"}
180
+ ]
181
+ },
182
+ {
183
+ "client_id": 30,
184
+ "datasets":[
185
+ {"dataset": "IEdit","subset_id": 0, "type":"open-ended", "metric":"RougeL"}
186
+ ]
187
+ },
188
+ {
189
+ "client_id": 31,
190
+ "datasets":[
191
+ {"dataset": "CLEVR-Change","subset_id": 0, "type":"open-ended", "metric":"RougeL"}
192
+ ]
193
+ },
194
+ {
195
+ "client_id": 32,
196
+ "datasets":[
197
+ {"dataset": "PororoSV","subset_id": 0, "type":"open-ended", "metric":"RougeL"}
198
+ ]
199
+ },
200
+ {
201
+ "client_id": 33,
202
+ "datasets":[
203
+ {"dataset": "FlintstonesSV","subset_id": 0, "type":"open-ended", "metric":"RougeL"}
204
+ ]
205
+ },
206
+ {
207
+ "client_id": 34,
208
+ "datasets":[
209
+ {"dataset": "VIST","subset_id": 0, "type":"open-ended", "metric":"RougeL"}
210
+ ]
211
+ },
212
+ {
213
+ "client_id": 35,
214
+ "datasets":[
215
+ {"dataset": "AESOP","subset_id": 0, "type":"open-ended", "metric":"RougeL"}
216
+ ]
217
+ },
218
+ {
219
+ "client_id": 36,
220
+ "datasets":[
221
+ {"dataset": "VISION","subset_id": 0, "type":"multi-choice"}
222
+ ]
223
+ },
224
+ {
225
+ "client_id": 37,
226
+ "datasets":[
227
+ {"dataset": "VISION","subset_id": 1, "type":"multi-choice"}
228
+ ]
229
+ },
230
+ {
231
+ "client_id": 38,
232
+ "datasets":[
233
+ {"dataset": "VizWiz","subset_id": 0, "type":"multi-choice"}
234
+ ]
235
+ },
236
+ {
237
+ "client_id": 39,
238
+ "datasets":[
239
+ {"dataset": "MIT-States","subset_id": 0, "type":"multi-choice"}
240
+ ]
241
+ }
242
+ ]