zhuohan-7 committed on
Commit
71dd565
·
verified ·
1 Parent(s): e68738a

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because the commit contains too many changes. See the raw diff for the complete list.
Files changed (50) hide show
  1. examples/aishell_asr_zh_test/data-00000-of-00001.arrow +3 -0
  2. examples/aishell_asr_zh_test/dataset_info.json +58 -0
  3. examples/aishell_asr_zh_test/state.json +13 -0
  4. examples/alpaca_audio_test/data-00000-of-00001.arrow +3 -0
  5. examples/alpaca_audio_test/dataset_info.json +49 -0
  6. examples/alpaca_audio_test/state.json +13 -0
  7. examples/audiocaps_qa_test/data-00000-of-00001.arrow +3 -0
  8. examples/audiocaps_qa_test/dataset_info.json +45 -0
  9. examples/audiocaps_qa_test/state.json +13 -0
  10. examples/audiocaps_test/data-00000-of-00001.arrow +3 -0
  11. examples/audiocaps_test/dataset_info.json +58 -0
  12. examples/audiocaps_test/state.json +13 -0
  13. examples/clotho_aqa_test/data-00000-of-00001.arrow +3 -0
  14. examples/clotho_aqa_test/dataset_info.json +58 -0
  15. examples/clotho_aqa_test/state.json +13 -0
  16. examples/cn_college_listen_mcq_test/data-00000-of-00001.arrow +3 -0
  17. examples/cn_college_listen_mcq_test/dataset_info.json +66 -0
  18. examples/cn_college_listen_mcq_test/state.json +13 -0
  19. examples/cna_test/data-00000-of-00001.arrow +3 -0
  20. examples/cna_test/dataset_info.json +20 -0
  21. examples/cna_test/state.json +13 -0
  22. examples/common_voice_15_en_test/data-00000-of-00001.arrow +3 -0
  23. examples/common_voice_15_en_test/dataset_info.json +28 -0
  24. examples/common_voice_15_en_test/state.json +19 -0
  25. examples/commonvoice_17_id_asr/data-00000-of-00001.arrow +3 -0
  26. examples/commonvoice_17_id_asr/dataset_info.json +132 -0
  27. examples/commonvoice_17_id_asr/state.json +13 -0
  28. examples/commonvoice_17_ta_asr/data-00000-of-00001.arrow +3 -0
  29. examples/commonvoice_17_ta_asr/dataset_info.json +156 -0
  30. examples/commonvoice_17_ta_asr/state.json +13 -0
  31. examples/commonvoice_17_th_asr/data-00000-of-00001.arrow +3 -0
  32. examples/commonvoice_17_th_asr/dataset_info.json +164 -0
  33. examples/commonvoice_17_th_asr/state.json +13 -0
  34. examples/commonvoice_17_vi_asr/data-00000-of-00001.arrow +3 -0
  35. examples/commonvoice_17_vi_asr/dataset_info.json +132 -0
  36. examples/commonvoice_17_vi_asr/state.json +13 -0
  37. examples/commonvoice_zh_asr/data-00000-of-00001.arrow +3 -0
  38. examples/commonvoice_zh_asr/dataset_info.json +182 -0
  39. examples/commonvoice_zh_asr/state.json +13 -0
  40. examples/covost2_en_id_test/data-00000-of-00001.arrow +3 -0
  41. examples/covost2_en_id_test/dataset_info.json +73 -0
  42. examples/covost2_en_id_test/state.json +13 -0
  43. examples/covost2_en_ta_test/data-00000-of-00001.arrow +3 -0
  44. examples/covost2_en_ta_test/dataset_info.json +73 -0
  45. examples/covost2_en_ta_test/state.json +13 -0
  46. examples/covost2_en_zh_test/data-00000-of-00001.arrow +3 -0
  47. examples/covost2_en_zh_test/dataset_info.json +73 -0
  48. examples/covost2_en_zh_test/state.json +13 -0
  49. examples/covost2_id_en_test/data-00000-of-00001.arrow +3 -0
  50. examples/covost2_id_en_test/dataset_info.json +45 -0
examples/aishell_asr_zh_test/data-00000-of-00001.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d8ed27441c9a5f6ac8b38e27b52ce555fe03322530ff16c16f2796c9f6e7f45
3
+ size 44296
examples/aishell_asr_zh_test/dataset_info.json ADDED
@@ -0,0 +1,58 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "builder_name": "parquet",
3
+ "citation": "",
4
+ "config_name": "default",
5
+ "dataset_name": "aishell_asr_zh_test_v1",
6
+ "dataset_size": 1115469955,
7
+ "description": "",
8
+ "download_checksums": {
9
+ "hf://datasets/AudioLLMs/aishell_asr_zh_test_v1@e73dc7f096ecea5c8e5c722446c8d3b4014fdd18/data/test-00000-of-00003.parquet": {
10
+ "num_bytes": 364047728,
11
+ "checksum": null
12
+ },
13
+ "hf://datasets/AudioLLMs/aishell_asr_zh_test_v1@e73dc7f096ecea5c8e5c722446c8d3b4014fdd18/data/test-00001-of-00003.parquet": {
14
+ "num_bytes": 354834886,
15
+ "checksum": null
16
+ },
17
+ "hf://datasets/AudioLLMs/aishell_asr_zh_test_v1@e73dc7f096ecea5c8e5c722446c8d3b4014fdd18/data/test-00002-of-00003.parquet": {
18
+ "num_bytes": 377041689,
19
+ "checksum": null
20
+ }
21
+ },
22
+ "download_size": 1095924303,
23
+ "features": {
24
+ "context": {
25
+ "_type": "Audio"
26
+ },
27
+ "instruction": {
28
+ "dtype": "string",
29
+ "_type": "Value"
30
+ },
31
+ "answer": {
32
+ "dtype": "string",
33
+ "_type": "Value"
34
+ }
35
+ },
36
+ "homepage": "",
37
+ "license": "",
38
+ "size_in_bytes": 2211394258,
39
+ "splits": {
40
+ "test": {
41
+ "name": "test",
42
+ "num_bytes": 1115469955,
43
+ "num_examples": 6920,
44
+ "shard_lengths": [
45
+ 3207,
46
+ 3107,
47
+ 606
48
+ ],
49
+ "dataset_name": "aishell_asr_zh_test_v1"
50
+ }
51
+ },
52
+ "version": {
53
+ "version_str": "0.0.0",
54
+ "major": 0,
55
+ "minor": 0,
56
+ "patch": 0
57
+ }
58
+ }
examples/aishell_asr_zh_test/state.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_data_files": [
3
+ {
4
+ "filename": "data-00000-of-00001.arrow"
5
+ }
6
+ ],
7
+ "_fingerprint": "5a1f0f8b9b3ca365",
8
+ "_format_columns": null,
9
+ "_format_kwargs": {},
10
+ "_format_type": null,
11
+ "_output_all_columns": false,
12
+ "_split": null
13
+ }
examples/alpaca_audio_test/data-00000-of-00001.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:acbe0fbf69f6732a358e6c6575354464b9c5e39b87be73cc9f1ae7c284e9e575
3
+ size 44600
examples/alpaca_audio_test/dataset_info.json ADDED
@@ -0,0 +1,49 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "builder_name": "parquet",
3
+ "citation": "",
4
+ "config_name": "default",
5
+ "dataset_name": "alpaca_audio_test",
6
+ "dataset_size": 13865321,
7
+ "description": "",
8
+ "download_checksums": {
9
+ "hf://datasets/AudioLLMs/alpaca_audio_test@7eb2ab279975033690d67bee66e45eb612a430ee/data/test-00000-of-00001.parquet": {
10
+ "num_bytes": 12245608,
11
+ "checksum": null
12
+ }
13
+ },
14
+ "download_size": 12245608,
15
+ "features": {
16
+ "context": {
17
+ "_type": "Audio"
18
+ },
19
+ "instruction": {
20
+ "dtype": "string",
21
+ "_type": "Value"
22
+ },
23
+ "speech_instruction": {
24
+ "dtype": "string",
25
+ "_type": "Value"
26
+ },
27
+ "answer": {
28
+ "dtype": "string",
29
+ "_type": "Value"
30
+ }
31
+ },
32
+ "homepage": "",
33
+ "license": "",
34
+ "size_in_bytes": 26110929,
35
+ "splits": {
36
+ "test": {
37
+ "name": "test",
38
+ "num_bytes": 13865321,
39
+ "num_examples": 100,
40
+ "dataset_name": "alpaca_audio_test"
41
+ }
42
+ },
43
+ "version": {
44
+ "version_str": "0.0.0",
45
+ "major": 0,
46
+ "minor": 0,
47
+ "patch": 0
48
+ }
49
+ }
examples/alpaca_audio_test/state.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_data_files": [
3
+ {
4
+ "filename": "data-00000-of-00001.arrow"
5
+ }
6
+ ],
7
+ "_fingerprint": "a7169220e58f4523",
8
+ "_format_columns": null,
9
+ "_format_kwargs": {},
10
+ "_format_type": null,
11
+ "_output_all_columns": false,
12
+ "_split": null
13
+ }
examples/audiocaps_qa_test/data-00000-of-00001.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc4745b0e32ece9d9f32f5a5a689eb5e24ca6755f114cd2b1f1f445819fa1375
3
+ size 103208
examples/audiocaps_qa_test/dataset_info.json ADDED
@@ -0,0 +1,45 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "builder_name": "parquet",
3
+ "citation": "",
4
+ "config_name": "default",
5
+ "dataset_name": "audiocaps_qa_test_v3",
6
+ "dataset_size": 98835422,
7
+ "description": "",
8
+ "download_checksums": {
9
+ "hf://datasets/AudioLLMs/audiocaps_qa_test_v3@6cf6853c52f55482126f226a8859eb71f2021e0e/data/test-00000-of-00001.parquet": {
10
+ "num_bytes": 92241687,
11
+ "checksum": null
12
+ }
13
+ },
14
+ "download_size": 92241687,
15
+ "features": {
16
+ "context": {
17
+ "_type": "Audio"
18
+ },
19
+ "instruction": {
20
+ "dtype": "string",
21
+ "_type": "Value"
22
+ },
23
+ "answer": {
24
+ "dtype": "string",
25
+ "_type": "Value"
26
+ }
27
+ },
28
+ "homepage": "",
29
+ "license": "",
30
+ "size_in_bytes": 191077109,
31
+ "splits": {
32
+ "test": {
33
+ "name": "test",
34
+ "num_bytes": 98835422,
35
+ "num_examples": 313,
36
+ "dataset_name": "audiocaps_qa_test_v3"
37
+ }
38
+ },
39
+ "version": {
40
+ "version_str": "0.0.0",
41
+ "major": 0,
42
+ "minor": 0,
43
+ "patch": 0
44
+ }
45
+ }
examples/audiocaps_qa_test/state.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_data_files": [
3
+ {
4
+ "filename": "data-00000-of-00001.arrow"
5
+ }
6
+ ],
7
+ "_fingerprint": "748c6693112f77f2",
8
+ "_format_columns": null,
9
+ "_format_kwargs": {},
10
+ "_format_type": null,
11
+ "_output_all_columns": false,
12
+ "_split": null
13
+ }
examples/audiocaps_test/data-00000-of-00001.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9cfff9093667c39e6750f23693d4d817193a0fbb829e3c6155d4a4c44462a184
3
+ size 107320
examples/audiocaps_test/dataset_info.json ADDED
@@ -0,0 +1,58 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "builder_name": "parquet",
3
+ "citation": "",
4
+ "config_name": "default",
5
+ "dataset_name": "audiocaps_test",
6
+ "dataset_size": 1389113784,
7
+ "description": "",
8
+ "download_checksums": {
9
+ "hf://datasets/AudioLLMs/audiocaps_test@fb42aac15212cbddd723fbbf04b6071b60a9f8fe/data/test-00000-of-00003.parquet": {
10
+ "num_bytes": 432299885,
11
+ "checksum": null
12
+ },
13
+ "hf://datasets/AudioLLMs/audiocaps_test@fb42aac15212cbddd723fbbf04b6071b60a9f8fe/data/test-00001-of-00003.parquet": {
14
+ "num_bytes": 435786346,
15
+ "checksum": null
16
+ },
17
+ "hf://datasets/AudioLLMs/audiocaps_test@fb42aac15212cbddd723fbbf04b6071b60a9f8fe/data/test-00002-of-00003.parquet": {
18
+ "num_bytes": 435930887,
19
+ "checksum": null
20
+ }
21
+ },
22
+ "download_size": 1304017118,
23
+ "features": {
24
+ "context": {
25
+ "_type": "Audio"
26
+ },
27
+ "instruction": {
28
+ "dtype": "string",
29
+ "_type": "Value"
30
+ },
31
+ "answer": {
32
+ "dtype": "string",
33
+ "_type": "Value"
34
+ }
35
+ },
36
+ "homepage": "",
37
+ "license": "",
38
+ "size_in_bytes": 2693130902,
39
+ "splits": {
40
+ "test": {
41
+ "name": "test",
42
+ "num_bytes": 1389113784,
43
+ "num_examples": 4400,
44
+ "shard_lengths": [
45
+ 1667,
46
+ 1667,
47
+ 1066
48
+ ],
49
+ "dataset_name": "audiocaps_test"
50
+ }
51
+ },
52
+ "version": {
53
+ "version_str": "0.0.0",
54
+ "major": 0,
55
+ "minor": 0,
56
+ "patch": 0
57
+ }
58
+ }
examples/audiocaps_test/state.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_data_files": [
3
+ {
4
+ "filename": "data-00000-of-00001.arrow"
5
+ }
6
+ ],
7
+ "_fingerprint": "1872292586a4b460",
8
+ "_format_columns": null,
9
+ "_format_kwargs": {},
10
+ "_format_type": null,
11
+ "_output_all_columns": false,
12
+ "_split": null
13
+ }
examples/clotho_aqa_test/data-00000-of-00001.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ad7fcb1e24f43a32efd32f08888b84f2ff5ebd275e43ca26e6230c7d01922cf
3
+ size 194400
examples/clotho_aqa_test/dataset_info.json ADDED
@@ -0,0 +1,58 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "builder_name": "parquet",
3
+ "citation": "",
4
+ "config_name": "default",
5
+ "dataset_name": "clotho_asqa_test_v2",
6
+ "dataset_size": 1485321871,
7
+ "description": "",
8
+ "download_checksums": {
9
+ "hf://datasets/AudioLLMs/clotho_asqa_test_v2@a7f4a7983d490e87a79eb041fede83e418c0ea4f/data/test-00000-of-00003.parquet": {
10
+ "num_bytes": 118559858,
11
+ "checksum": null
12
+ },
13
+ "hf://datasets/AudioLLMs/clotho_asqa_test_v2@a7f4a7983d490e87a79eb041fede83e418c0ea4f/data/test-00001-of-00003.parquet": {
14
+ "num_bytes": 116519615,
15
+ "checksum": null
16
+ },
17
+ "hf://datasets/AudioLLMs/clotho_asqa_test_v2@a7f4a7983d490e87a79eb041fede83e418c0ea4f/data/test-00002-of-00003.parquet": {
18
+ "num_bytes": 113032047,
19
+ "checksum": null
20
+ }
21
+ },
22
+ "download_size": 348111520,
23
+ "features": {
24
+ "context": {
25
+ "_type": "Audio"
26
+ },
27
+ "instruction": {
28
+ "dtype": "string",
29
+ "_type": "Value"
30
+ },
31
+ "answer": {
32
+ "dtype": "string",
33
+ "_type": "Value"
34
+ }
35
+ },
36
+ "homepage": "",
37
+ "license": "",
38
+ "size_in_bytes": 1833433391,
39
+ "splits": {
40
+ "test": {
41
+ "name": "test",
42
+ "num_bytes": 1485321871,
43
+ "num_examples": 2057,
44
+ "shard_lengths": [
45
+ 786,
46
+ 786,
47
+ 485
48
+ ],
49
+ "dataset_name": "clotho_asqa_test_v2"
50
+ }
51
+ },
52
+ "version": {
53
+ "version_str": "0.0.0",
54
+ "major": 0,
55
+ "minor": 0,
56
+ "patch": 0
57
+ }
58
+ }
examples/clotho_aqa_test/state.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_data_files": [
3
+ {
4
+ "filename": "data-00000-of-00001.arrow"
5
+ }
6
+ ],
7
+ "_fingerprint": "35d1627b19106626",
8
+ "_format_columns": null,
9
+ "_format_kwargs": {},
10
+ "_format_type": null,
11
+ "_output_all_columns": false,
12
+ "_split": null
13
+ }
examples/cn_college_listen_mcq_test/data-00000-of-00001.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3131dbbd9306a9622d446f8f151f1db0dd7ba3a14bd82f711126d159a813d5d5
3
+ size 152776
examples/cn_college_listen_mcq_test/dataset_info.json ADDED
@@ -0,0 +1,66 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "builder_name": "parquet",
3
+ "citation": "",
4
+ "config_name": "default",
5
+ "dataset_name": "cn_college_listen_mcq_test",
6
+ "dataset_size": 1532841284,
7
+ "description": "",
8
+ "download_checksums": {
9
+ "hf://datasets/AudioLLMs/cn_college_listen_mcq_test@708d8ef278b5eadae714c314889f5d81ded18a25/data/test-00000-of-00004.parquet": {
10
+ "num_bytes": 283046288,
11
+ "checksum": null
12
+ },
13
+ "hf://datasets/AudioLLMs/cn_college_listen_mcq_test@708d8ef278b5eadae714c314889f5d81ded18a25/data/test-00001-of-00004.parquet": {
14
+ "num_bytes": 241939389,
15
+ "checksum": null
16
+ },
17
+ "hf://datasets/AudioLLMs/cn_college_listen_mcq_test@708d8ef278b5eadae714c314889f5d81ded18a25/data/test-00002-of-00004.parquet": {
18
+ "num_bytes": 248376444,
19
+ "checksum": null
20
+ },
21
+ "hf://datasets/AudioLLMs/cn_college_listen_mcq_test@708d8ef278b5eadae714c314889f5d81ded18a25/data/test-00003-of-00004.parquet": {
22
+ "num_bytes": 256294919,
23
+ "checksum": null
24
+ }
25
+ },
26
+ "download_size": 1029657040,
27
+ "features": {
28
+ "context": {
29
+ "_type": "Audio"
30
+ },
31
+ "instruction": {
32
+ "dtype": "string",
33
+ "_type": "Value"
34
+ },
35
+ "choices": {
36
+ "dtype": "string",
37
+ "_type": "Value"
38
+ },
39
+ "answer": {
40
+ "dtype": "string",
41
+ "_type": "Value"
42
+ }
43
+ },
44
+ "homepage": "",
45
+ "license": "",
46
+ "size_in_bytes": 2562498324,
47
+ "splits": {
48
+ "test": {
49
+ "name": "test",
50
+ "num_bytes": 1532841284,
51
+ "num_examples": 2271,
52
+ "shard_lengths": [
53
+ 500,
54
+ 1036,
55
+ 735
56
+ ],
57
+ "dataset_name": "cn_college_listen_mcq_test"
58
+ }
59
+ },
60
+ "version": {
61
+ "version_str": "0.0.0",
62
+ "major": 0,
63
+ "minor": 0,
64
+ "patch": 0
65
+ }
66
+ }
examples/cn_college_listen_mcq_test/state.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_data_files": [
3
+ {
4
+ "filename": "data-00000-of-00001.arrow"
5
+ }
6
+ ],
7
+ "_fingerprint": "d42e39c8837074fc",
8
+ "_format_columns": null,
9
+ "_format_kwargs": {},
10
+ "_format_type": null,
11
+ "_output_all_columns": false,
12
+ "_split": null
13
+ }
examples/cna_test/data-00000-of-00001.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d37e6858c1291ebeb2bcb6bfbe8f5291da48f4199a46ae88a60eb57fa135b61f
3
+ size 34600
examples/cna_test/dataset_info.json ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "citation": "",
3
+ "description": "",
4
+ "features": {
5
+ "context": {
6
+ "sampling_rate": 16000,
7
+ "_type": "Audio"
8
+ },
9
+ "instruction": {
10
+ "dtype": "string",
11
+ "_type": "Value"
12
+ },
13
+ "answer": {
14
+ "dtype": "string",
15
+ "_type": "Value"
16
+ }
17
+ },
18
+ "homepage": "",
19
+ "license": ""
20
+ }
examples/cna_test/state.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_data_files": [
3
+ {
4
+ "filename": "data-00000-of-00001.arrow"
5
+ }
6
+ ],
7
+ "_fingerprint": "22ae0abf541af796",
8
+ "_format_columns": null,
9
+ "_format_kwargs": {},
10
+ "_format_type": null,
11
+ "_output_all_columns": false,
12
+ "_split": null
13
+ }
examples/common_voice_15_en_test/data-00000-of-00001.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fd5f49efa47828a4a7b9a6fc584b19562acae2f90451219939b0c11b4d41621f
3
+ size 54992
examples/common_voice_15_en_test/dataset_info.json ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "citation": "",
3
+ "description": "",
4
+ "features": {
5
+ "context": {
6
+ "sampling_rate": 16000,
7
+ "_type": "Audio"
8
+ },
9
+ "instruction": {
10
+ "dtype": "string",
11
+ "_type": "Value"
12
+ },
13
+ "answer": {
14
+ "dtype": "string",
15
+ "_type": "Value"
16
+ },
17
+ "language": {
18
+ "dtype": "string",
19
+ "_type": "Value"
20
+ },
21
+ "audio_length": {
22
+ "dtype": "float64",
23
+ "_type": "Value"
24
+ }
25
+ },
26
+ "homepage": "",
27
+ "license": ""
28
+ }
examples/common_voice_15_en_test/state.json ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_data_files": [
3
+ {
4
+ "filename": "data-00000-of-00001.arrow"
5
+ }
6
+ ],
7
+ "_fingerprint": "62012827f888a0f5",
8
+ "_format_columns": [
9
+ "answer",
10
+ "audio_length",
11
+ "context",
12
+ "instruction",
13
+ "language"
14
+ ],
15
+ "_format_kwargs": {},
16
+ "_format_type": null,
17
+ "_output_all_columns": false,
18
+ "_split": null
19
+ }
examples/commonvoice_17_id_asr/data-00000-of-00001.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae05a4b823184603908f2b4149190b4fab9965be5468f6b4fa34e0e214c97760
3
+ size 43784
examples/commonvoice_17_id_asr/dataset_info.json ADDED
@@ -0,0 +1,132 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "builder_name": "common_voice_17_0",
3
+ "citation": "@inproceedings{commonvoice:2020,\n author = {Ardila, R. and Branson, M. and Davis, K. and Henretty, M. and Kohler, M. and Meyer, J. and Morais, R. and Saunders, L. and Tyers, F. M. and Weber, G.},\n title = {Common Voice: A Massively-Multilingual Speech Corpus},\n booktitle = {Proceedings of the 12th Conference on Language Resources and Evaluation (LREC 2020)},\n pages = {4211--4215},\n year = 2020\n}\n",
4
+ "config_name": "id",
5
+ "dataset_name": "common_voice_17_0",
6
+ "dataset_size": 42157018,
7
+ "description": "Common Voice is Mozilla's initiative to help teach machines how real people speak. The dataset currently consists of 20408 validated hours of speech in 124 languages, but more voices and languages are always added.",
8
+ "download_checksums": {
9
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/n_shards.json": {
10
+ "num_bytes": 17491,
11
+ "checksum": null
12
+ },
13
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/id/train/id_train_0.tar": {
14
+ "num_bytes": 170035200,
15
+ "checksum": null
16
+ },
17
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/id/dev/id_dev_0.tar": {
18
+ "num_bytes": 102236160,
19
+ "checksum": null
20
+ },
21
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/id/test/id_test_0.tar": {
22
+ "num_bytes": 110315520,
23
+ "checksum": null
24
+ },
25
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/id/other/id_other_0.tar": {
26
+ "num_bytes": 686858240,
27
+ "checksum": null
28
+ },
29
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/id/invalidated/id_invalidated_0.tar": {
30
+ "num_bytes": 68034560,
31
+ "checksum": null
32
+ },
33
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/id/validated/id_validated_0.tar": {
34
+ "num_bytes": 805611520,
35
+ "checksum": null
36
+ },
37
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/id/train.tsv": {
38
+ "num_bytes": 1571021,
39
+ "checksum": null
40
+ },
41
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/id/dev.tsv": {
42
+ "num_bytes": 1016964,
43
+ "checksum": null
44
+ },
45
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/id/test.tsv": {
46
+ "num_bytes": 1052525,
47
+ "checksum": null
48
+ },
49
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/id/other.tsv": {
50
+ "num_bytes": 8607181,
51
+ "checksum": null
52
+ },
53
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/id/invalidated.tsv": {
54
+ "num_bytes": 784798,
55
+ "checksum": null
56
+ },
57
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/id/validated.tsv": {
58
+ "num_bytes": 7772548,
59
+ "checksum": null
60
+ }
61
+ },
62
+ "download_size": 1963913728,
63
+ "features": {
64
+ "context": {
65
+ "sampling_rate": 16000,
66
+ "_type": "Audio"
67
+ },
68
+ "instruction": {
69
+ "dtype": "string",
70
+ "_type": "Value"
71
+ },
72
+ "answer": {
73
+ "dtype": "string",
74
+ "_type": "Value"
75
+ },
76
+ "audio_length": {
77
+ "dtype": "float64",
78
+ "_type": "Value"
79
+ },
80
+ "language": {
81
+ "dtype": "string",
82
+ "_type": "Value"
83
+ }
84
+ },
85
+ "homepage": "https://commonvoice.mozilla.org/en/datasets",
86
+ "license": "https://creativecommons.org/publicdomain/zero/1.0/",
87
+ "size_in_bytes": 2006070746,
88
+ "splits": {
89
+ "train": {
90
+ "name": "train",
91
+ "num_bytes": 3067499,
92
+ "num_examples": 4970,
93
+ "dataset_name": "common_voice_17_0"
94
+ },
95
+ "validation": {
96
+ "name": "validation",
97
+ "num_bytes": 2011909,
98
+ "num_examples": 3349,
99
+ "dataset_name": "common_voice_17_0"
100
+ },
101
+ "test": {
102
+ "name": "test",
103
+ "num_bytes": 2141524,
104
+ "num_examples": 3641,
105
+ "dataset_name": "common_voice_17_0"
106
+ },
107
+ "other": {
108
+ "name": "other",
109
+ "num_bytes": 17492664,
110
+ "num_examples": 29508,
111
+ "dataset_name": "common_voice_17_0"
112
+ },
113
+ "invalidated": {
114
+ "name": "invalidated",
115
+ "num_bytes": 1600375,
116
+ "num_examples": 2605,
117
+ "dataset_name": "common_voice_17_0"
118
+ },
119
+ "validated": {
120
+ "name": "validated",
121
+ "num_bytes": 15843047,
122
+ "num_examples": 26108,
123
+ "dataset_name": "common_voice_17_0"
124
+ }
125
+ },
126
+ "version": {
127
+ "version_str": "17.0.0",
128
+ "major": 17,
129
+ "minor": 0,
130
+ "patch": 0
131
+ }
132
+ }
examples/commonvoice_17_id_asr/state.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_data_files": [
3
+ {
4
+ "filename": "data-00000-of-00001.arrow"
5
+ }
6
+ ],
7
+ "_fingerprint": "75931a254b089787",
8
+ "_format_columns": null,
9
+ "_format_kwargs": {},
10
+ "_format_type": null,
11
+ "_output_all_columns": false,
12
+ "_split": null
13
+ }
examples/commonvoice_17_ta_asr/data-00000-of-00001.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98470c84b50bb5c1b10476e4f6ea518ddd9127b64b0c680302f774af7b538b71
3
+ size 90616
examples/commonvoice_17_ta_asr/dataset_info.json ADDED
@@ -0,0 +1,156 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "builder_name": "common_voice_17_0",
3
+ "citation": "@inproceedings{commonvoice:2020,\n author = {Ardila, R. and Branson, M. and Davis, K. and Henretty, M. and Kohler, M. and Meyer, J. and Morais, R. and Saunders, L. and Tyers, F. M. and Weber, G.},\n title = {Common Voice: A Massively-Multilingual Speech Corpus},\n booktitle = {Proceedings of the 12th Conference on Language Resources and Evaluation (LREC 2020)},\n pages = {4211--4215},\n year = 2020\n}\n",
4
+ "config_name": "ta",
5
+ "dataset_name": "common_voice_17_0",
6
+ "dataset_size": 221361139,
7
+ "description": "Common Voice is Mozilla's initiative to help teach machines how real people speak. The dataset currently consists of 20408 validated hours of speech in 124 languages, but more voices and languages are always added.",
8
+ "download_checksums": {
9
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/n_shards.json": {
10
+ "num_bytes": 17491,
11
+ "checksum": null
12
+ },
13
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/ta/train/ta_train_0.tar": {
14
+ "num_bytes": 1598955520,
15
+ "checksum": null
16
+ },
17
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/ta/train/ta_train_1.tar": {
18
+ "num_bytes": 224542720,
19
+ "checksum": null
20
+ },
21
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/ta/dev/ta_dev_0.tar": {
22
+ "num_bytes": 434257920,
23
+ "checksum": null
24
+ },
25
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/ta/test/ta_test_0.tar": {
26
+ "num_bytes": 454778880,
27
+ "checksum": null
28
+ },
29
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/ta/other/ta_other_0.tar": {
30
+ "num_bytes": 1560514560,
31
+ "checksum": null
32
+ },
33
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/ta/other/ta_other_1.tar": {
34
+ "num_bytes": 1515827200,
35
+ "checksum": null
36
+ },
37
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/ta/other/ta_other_2.tar": {
38
+ "num_bytes": 495831040,
39
+ "checksum": null
40
+ },
41
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/ta/invalidated/ta_invalidated_0.tar": {
42
+ "num_bytes": 231424000,
43
+ "checksum": null
44
+ },
45
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/ta/validated/ta_validated_0.tar": {
46
+ "num_bytes": 1447434240,
47
+ "checksum": null
48
+ },
49
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/ta/validated/ta_validated_1.tar": {
50
+ "num_bytes": 1530644480,
51
+ "checksum": null
52
+ },
53
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/ta/validated/ta_validated_2.tar": {
54
+ "num_bytes": 1654978560,
55
+ "checksum": null
56
+ },
57
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/ta/validated/ta_validated_3.tar": {
58
+ "num_bytes": 652861440,
59
+ "checksum": null
60
+ },
61
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/ta/train.tsv": {
62
+ "num_bytes": 19608830,
63
+ "checksum": null
64
+ },
65
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/ta/dev.tsv": {
66
+ "num_bytes": 5203704,
67
+ "checksum": null
68
+ },
69
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/ta/test.tsv": {
70
+ "num_bytes": 4944646,
71
+ "checksum": null
72
+ },
73
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/ta/other.tsv": {
74
+ "num_bytes": 39470943,
75
+ "checksum": null
76
+ },
77
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/ta/invalidated.tsv": {
78
+ "num_bytes": 2499761,
79
+ "checksum": null
80
+ },
81
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/ta/validated.tsv": {
82
+ "num_bytes": 56763398,
83
+ "checksum": null
84
+ }
85
+ },
86
+ "download_size": 11930559333,
87
+ "features": {
88
+ "context": {
89
+ "sampling_rate": 16000,
90
+ "_type": "Audio"
91
+ },
92
+ "instruction": {
93
+ "dtype": "string",
94
+ "_type": "Value"
95
+ },
96
+ "answer": {
97
+ "dtype": "string",
98
+ "_type": "Value"
99
+ },
100
+ "audio_length": {
101
+ "dtype": "float64",
102
+ "_type": "Value"
103
+ },
104
+ "language": {
105
+ "dtype": "string",
106
+ "_type": "Value"
107
+ }
108
+ },
109
+ "homepage": "https://commonvoice.mozilla.org/en/datasets",
110
+ "license": "https://creativecommons.org/publicdomain/zero/1.0/",
111
+ "size_in_bytes": 12151920472,
112
+ "splits": {
113
+ "train": {
114
+ "name": "train",
115
+ "num_bytes": 33336098,
116
+ "num_examples": 45587,
117
+ "dataset_name": "common_voice_17_0"
118
+ },
119
+ "validation": {
120
+ "name": "validation",
121
+ "num_bytes": 8797317,
122
+ "num_examples": 12095,
123
+ "dataset_name": "common_voice_17_0"
124
+ },
125
+ "test": {
126
+ "name": "test",
127
+ "num_bytes": 8556167,
128
+ "num_examples": 12074,
129
+ "dataset_name": "common_voice_17_0"
130
+ },
131
+ "other": {
132
+ "name": "other",
133
+ "num_bytes": 67773267,
134
+ "num_examples": 93989,
135
+ "dataset_name": "common_voice_17_0"
136
+ },
137
+ "invalidated": {
138
+ "name": "invalidated",
139
+ "num_bytes": 4282268,
140
+ "num_examples": 5693,
141
+ "dataset_name": "common_voice_17_0"
142
+ },
143
+ "validated": {
144
+ "name": "validated",
145
+ "num_bytes": 98616022,
146
+ "num_examples": 135391,
147
+ "dataset_name": "common_voice_17_0"
148
+ }
149
+ },
150
+ "version": {
151
+ "version_str": "17.0.0",
152
+ "major": 17,
153
+ "minor": 0,
154
+ "patch": 0
155
+ }
156
+ }
examples/commonvoice_17_ta_asr/state.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_data_files": [
3
+ {
4
+ "filename": "data-00000-of-00001.arrow"
5
+ }
6
+ ],
7
+ "_fingerprint": "380f8a99e8b3657c",
8
+ "_format_columns": null,
9
+ "_format_kwargs": {},
10
+ "_format_type": null,
11
+ "_output_all_columns": false,
12
+ "_split": null
13
+ }
examples/commonvoice_17_th_asr/data-00000-of-00001.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bfd84989250d4b79f4cb4b0ae5028d032e221858d6dab77494a04a8a2336aab4
3
+ size 44792
examples/commonvoice_17_th_asr/dataset_info.json ADDED
@@ -0,0 +1,164 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "builder_name": "common_voice_17_0",
3
+ "citation": "@inproceedings{commonvoice:2020,\n author = {Ardila, R. and Branson, M. and Davis, K. and Henretty, M. and Kohler, M. and Meyer, J. and Morais, R. and Saunders, L. and Tyers, F. M. and Weber, G.},\n title = {Common Voice: A Massively-Multilingual Speech Corpus},\n booktitle = {Proceedings of the 12th Conference on Language Resources and Evaluation (LREC 2020)},\n pages = {4211--4215},\n year = 2020\n}\n",
4
+ "config_name": "th",
5
+ "dataset_name": "common_voice_17_0",
6
+ "dataset_size": 271837409,
7
+ "description": "Common Voice is Mozilla's initiative to help teach machines how real people speak. The dataset currently consists of 20408 validated hours of speech in 124 languages, but more voices and languages are always added.",
8
+ "download_checksums": {
9
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/n_shards.json": {
10
+ "num_bytes": 17491,
11
+ "checksum": null
12
+ },
13
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/th/train/th_train_0.tar": {
14
+ "num_bytes": 838082560,
15
+ "checksum": null
16
+ },
17
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/th/dev/th_dev_0.tar": {
18
+ "num_bytes": 323399680,
19
+ "checksum": null
20
+ },
21
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/th/test/th_test_0.tar": {
22
+ "num_bytes": 335851520,
23
+ "checksum": null
24
+ },
25
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/th/other/th_other_0.tar": {
26
+ "num_bytes": 1147064320,
27
+ "checksum": null
28
+ },
29
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/th/other/th_other_1.tar": {
30
+ "num_bytes": 1057300480,
31
+ "checksum": null
32
+ },
33
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/th/other/th_other_2.tar": {
34
+ "num_bytes": 943237120,
35
+ "checksum": null
36
+ },
37
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/th/other/th_other_3.tar": {
38
+ "num_bytes": 837079040,
39
+ "checksum": null
40
+ },
41
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/th/other/th_other_4.tar": {
42
+ "num_bytes": 1055385600,
43
+ "checksum": null
44
+ },
45
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/th/other/th_other_5.tar": {
46
+ "num_bytes": 176015360,
47
+ "checksum": null
48
+ },
49
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/th/invalidated/th_invalidated_0.tar": {
50
+ "num_bytes": 287416320,
51
+ "checksum": null
52
+ },
53
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/th/validated/th_validated_0.tar": {
54
+ "num_bytes": 1191843840,
55
+ "checksum": null
56
+ },
57
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/th/validated/th_validated_1.tar": {
58
+ "num_bytes": 1079930880,
59
+ "checksum": null
60
+ },
61
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/th/validated/th_validated_2.tar": {
62
+ "num_bytes": 1014691840,
63
+ "checksum": null
64
+ },
65
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/th/validated/th_validated_3.tar": {
66
+ "num_bytes": 744366080,
67
+ "checksum": null
68
+ },
69
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/th/train.tsv": {
70
+ "num_bytes": 11337047,
71
+ "checksum": null
72
+ },
73
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/th/dev.tsv": {
74
+ "num_bytes": 3803758,
75
+ "checksum": null
76
+ },
77
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/th/test.tsv": {
78
+ "num_bytes": 3702050,
79
+ "checksum": null
80
+ },
81
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/th/other.tsv": {
82
+ "num_bytes": 71870764,
83
+ "checksum": null
84
+ },
85
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/th/invalidated.tsv": {
86
+ "num_bytes": 3301372,
87
+ "checksum": null
88
+ },
89
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/th/validated.tsv": {
90
+ "num_bytes": 50649618,
91
+ "checksum": null
92
+ }
93
+ },
94
+ "download_size": 11176346740,
95
+ "features": {
96
+ "context": {
97
+ "sampling_rate": 16000,
98
+ "_type": "Audio"
99
+ },
100
+ "instruction": {
101
+ "dtype": "string",
102
+ "_type": "Value"
103
+ },
104
+ "answer": {
105
+ "dtype": "string",
106
+ "_type": "Value"
107
+ },
108
+ "audio_length": {
109
+ "dtype": "float64",
110
+ "_type": "Value"
111
+ },
112
+ "language": {
113
+ "dtype": "string",
114
+ "_type": "Value"
115
+ }
116
+ },
117
+ "homepage": "https://commonvoice.mozilla.org/en/datasets",
118
+ "license": "https://creativecommons.org/publicdomain/zero/1.0/",
119
+ "size_in_bytes": 11448184149,
120
+ "splits": {
121
+ "train": {
122
+ "name": "train",
123
+ "num_bytes": 21220759,
124
+ "num_examples": 32823,
125
+ "dataset_name": "common_voice_17_0"
126
+ },
127
+ "validation": {
128
+ "name": "validation",
129
+ "num_bytes": 7084499,
130
+ "num_examples": 11042,
131
+ "dataset_name": "common_voice_17_0"
132
+ },
133
+ "test": {
134
+ "name": "test",
135
+ "num_bytes": 7004874,
136
+ "num_examples": 11042,
137
+ "dataset_name": "common_voice_17_0"
138
+ },
139
+ "other": {
140
+ "name": "other",
141
+ "num_bytes": 134183952,
142
+ "num_examples": 206935,
143
+ "dataset_name": "common_voice_17_0"
144
+ },
145
+ "invalidated": {
146
+ "name": "invalidated",
147
+ "num_bytes": 6202988,
148
+ "num_examples": 9267,
149
+ "dataset_name": "common_voice_17_0"
150
+ },
151
+ "validated": {
152
+ "name": "validated",
153
+ "num_bytes": 96140337,
154
+ "num_examples": 147160,
155
+ "dataset_name": "common_voice_17_0"
156
+ }
157
+ },
158
+ "version": {
159
+ "version_str": "17.0.0",
160
+ "major": 17,
161
+ "minor": 0,
162
+ "patch": 0
163
+ }
164
+ }
examples/commonvoice_17_th_asr/state.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_data_files": [
3
+ {
4
+ "filename": "data-00000-of-00001.arrow"
5
+ }
6
+ ],
7
+ "_fingerprint": "4b0c4a31664c7d67",
8
+ "_format_columns": null,
9
+ "_format_kwargs": {},
10
+ "_format_type": null,
11
+ "_output_all_columns": false,
12
+ "_split": null
13
+ }
examples/commonvoice_17_vi_asr/data-00000-of-00001.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4249665ed76ad59af6281a9c0bacc6862d8cd750218637cd8570bc9d89002751
3
+ size 39104
examples/commonvoice_17_vi_asr/dataset_info.json ADDED
@@ -0,0 +1,132 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "builder_name": "common_voice_17_0",
3
+ "citation": "@inproceedings{commonvoice:2020,\n author = {Ardila, R. and Branson, M. and Davis, K. and Henretty, M. and Kohler, M. and Meyer, J. and Morais, R. and Saunders, L. and Tyers, F. M. and Weber, G.},\n title = {Common Voice: A Massively-Multilingual Speech Corpus},\n booktitle = {Proceedings of the 12th Conference on Language Resources and Evaluation (LREC 2020)},\n pages = {4211--4215},\n year = 2020\n}\n",
4
+ "config_name": "vi",
5
+ "dataset_name": "common_voice_17_0",
6
+ "dataset_size": 12705254,
7
+ "description": "Common Voice is Mozilla's initiative to help teach machines how real people speak. The dataset currently consists of 20408 validated hours of speech in 124 languages, but more voices and languages are always added.",
8
+ "download_checksums": {
9
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/n_shards.json": {
10
+ "num_bytes": 17491,
11
+ "checksum": null
12
+ },
13
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/vi/train/vi_train_0.tar": {
14
+ "num_bytes": 69468160,
15
+ "checksum": null
16
+ },
17
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/vi/dev/vi_dev_0.tar": {
18
+ "num_bytes": 14479360,
19
+ "checksum": null
20
+ },
21
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/vi/test/vi_test_0.tar": {
22
+ "num_bytes": 34488320,
23
+ "checksum": null
24
+ },
25
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/vi/other/vi_other_0.tar": {
26
+ "num_bytes": 276172800,
27
+ "checksum": null
28
+ },
29
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/vi/invalidated/vi_invalidated_0.tar": {
30
+ "num_bytes": 11345920,
31
+ "checksum": null
32
+ },
33
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/vi/validated/vi_validated_0.tar": {
34
+ "num_bytes": 144384000,
35
+ "checksum": null
36
+ },
37
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/vi/train.tsv": {
38
+ "num_bytes": 688189,
39
+ "checksum": null
40
+ },
41
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/vi/dev.tsv": {
42
+ "num_bytes": 184767,
43
+ "checksum": null
44
+ },
45
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/vi/test.tsv": {
46
+ "num_bytes": 373370,
47
+ "checksum": null
48
+ },
49
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/vi/other.tsv": {
50
+ "num_bytes": 3384906,
51
+ "checksum": null
52
+ },
53
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/vi/invalidated.tsv": {
54
+ "num_bytes": 111099,
55
+ "checksum": null
56
+ },
57
+ "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/vi/validated.tsv": {
58
+ "num_bytes": 1521796,
59
+ "checksum": null
60
+ }
61
+ },
62
+ "download_size": 556620178,
63
+ "features": {
64
+ "context": {
65
+ "sampling_rate": 16000,
66
+ "_type": "Audio"
67
+ },
68
+ "instruction": {
69
+ "dtype": "string",
70
+ "_type": "Value"
71
+ },
72
+ "answer": {
73
+ "dtype": "string",
74
+ "_type": "Value"
75
+ },
76
+ "audio_length": {
77
+ "dtype": "float64",
78
+ "_type": "Value"
79
+ },
80
+ "language": {
81
+ "dtype": "string",
82
+ "_type": "Value"
83
+ }
84
+ },
85
+ "homepage": "https://commonvoice.mozilla.org/en/datasets",
86
+ "license": "https://creativecommons.org/publicdomain/zero/1.0/",
87
+ "size_in_bytes": 569325432,
88
+ "splits": {
89
+ "train": {
90
+ "name": "train",
91
+ "num_bytes": 1380061,
92
+ "num_examples": 2298,
93
+ "dataset_name": "common_voice_17_0"
94
+ },
95
+ "validation": {
96
+ "name": "validation",
97
+ "num_bytes": 375111,
98
+ "num_examples": 641,
99
+ "dataset_name": "common_voice_17_0"
100
+ },
101
+ "test": {
102
+ "name": "test",
103
+ "num_bytes": 754342,
104
+ "num_examples": 1274,
105
+ "dataset_name": "common_voice_17_0"
106
+ },
107
+ "other": {
108
+ "name": "other",
109
+ "num_bytes": 6857667,
110
+ "num_examples": 11533,
111
+ "dataset_name": "common_voice_17_0"
112
+ },
113
+ "invalidated": {
114
+ "name": "invalidated",
115
+ "num_bytes": 229034,
116
+ "num_examples": 377,
117
+ "dataset_name": "common_voice_17_0"
118
+ },
119
+ "validated": {
120
+ "name": "validated",
121
+ "num_bytes": 3109039,
122
+ "num_examples": 5135,
123
+ "dataset_name": "common_voice_17_0"
124
+ }
125
+ },
126
+ "version": {
127
+ "version_str": "17.0.0",
128
+ "major": 17,
129
+ "minor": 0,
130
+ "patch": 0
131
+ }
132
+ }
examples/commonvoice_17_vi_asr/state.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_data_files": [
3
+ {
4
+ "filename": "data-00000-of-00001.arrow"
5
+ }
6
+ ],
7
+ "_fingerprint": "6ce07a66a0e6d7b0",
8
+ "_format_columns": null,
9
+ "_format_kwargs": {},
10
+ "_format_type": null,
11
+ "_output_all_columns": false,
12
+ "_split": null
13
+ }
examples/commonvoice_zh_asr/data-00000-of-00001.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:951bb47527709c895c17e6dac4a4a43b2a141b16babd39e56d9199deaec72eb5
3
+ size 68224
examples/commonvoice_zh_asr/dataset_info.json ADDED
@@ -0,0 +1,182 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "builder_name": "common_voice_16_0",
3
+ "citation": "@inproceedings{commonvoice:2020,\n author = {Ardila, R. and Branson, M. and Davis, K. and Henretty, M. and Kohler, M. and Meyer, J. and Morais, R. and Saunders, L. and Tyers, F. M. and Weber, G.},\n title = {Common Voice: A Massively-Multilingual Speech Corpus},\n booktitle = {Proceedings of the 12th Conference on Language Resources and Evaluation (LREC 2020)},\n pages = {4211--4215},\n year = 2020\n}\n",
4
+ "config_name": "zh-CN",
5
+ "dataset_name": "common_voice_16_0",
6
+ "dataset_size": 423983727,
7
+ "description": "Common Voice is Mozilla's initiative to help teach machines how real people speak. The dataset currently consists of 19159 validated hours of speech in 119 languages, but more voices and languages are always added.",
8
+ "download_checksums": {
9
+ "https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/n_shards.json": {
10
+ "num_bytes": 17487,
11
+ "checksum": null
12
+ },
13
+ "https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/audio/zh-CN/train/zh-CN_train_0.tar": {
14
+ "num_bytes": 1157220864,
15
+ "checksum": null
16
+ },
17
+ "https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/audio/zh-CN/dev/zh-CN_dev_0.tar": {
18
+ "num_bytes": 436442624,
19
+ "checksum": null
20
+ },
21
+ "https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/audio/zh-CN/test/zh-CN_test_0.tar": {
22
+ "num_bytes": 506296320,
23
+ "checksum": null
24
+ },
25
+ "https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/audio/zh-CN/other/zh-CN_other_0.tar": {
26
+ "num_bytes": 1252570624,
27
+ "checksum": null
28
+ },
29
+ "https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/audio/zh-CN/other/zh-CN_other_1.tar": {
30
+ "num_bytes": 1216365056,
31
+ "checksum": null
32
+ },
33
+ "https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/audio/zh-CN/other/zh-CN_other_2.tar": {
34
+ "num_bytes": 1057693696,
35
+ "checksum": null
36
+ },
37
+ "https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/audio/zh-CN/other/zh-CN_other_3.tar": {
38
+ "num_bytes": 1037878784,
39
+ "checksum": null
40
+ },
41
+ "https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/audio/zh-CN/other/zh-CN_other_4.tar": {
42
+ "num_bytes": 1006488064,
43
+ "checksum": null
44
+ },
45
+ "https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/audio/zh-CN/other/zh-CN_other_5.tar": {
46
+ "num_bytes": 951297024,
47
+ "checksum": null
48
+ },
49
+ "https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/audio/zh-CN/other/zh-CN_other_6.tar": {
50
+ "num_bytes": 1054305280,
51
+ "checksum": null
52
+ },
53
+ "https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/audio/zh-CN/other/zh-CN_other_7.tar": {
54
+ "num_bytes": 1079122944,
55
+ "checksum": null
56
+ },
57
+ "https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/audio/zh-CN/other/zh-CN_other_8.tar": {
58
+ "num_bytes": 1057605632,
59
+ "checksum": null
60
+ },
61
+ "https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/audio/zh-CN/other/zh-CN_other_9.tar": {
62
+ "num_bytes": 1054744064,
63
+ "checksum": null
64
+ },
65
+ "https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/audio/zh-CN/other/zh-CN_other_10.tar": {
66
+ "num_bytes": 1037184512,
67
+ "checksum": null
68
+ },
69
+ "https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/audio/zh-CN/other/zh-CN_other_11.tar": {
70
+ "num_bytes": 1081821184,
71
+ "checksum": null
72
+ },
73
+ "https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/audio/zh-CN/other/zh-CN_other_12.tar": {
74
+ "num_bytes": 1144596992,
75
+ "checksum": null
76
+ },
77
+ "https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/audio/zh-CN/other/zh-CN_other_13.tar": {
78
+ "num_bytes": 1211527680,
79
+ "checksum": null
80
+ },
81
+ "https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/audio/zh-CN/other/zh-CN_other_14.tar": {
82
+ "num_bytes": 1190928384,
83
+ "checksum": null
84
+ },
85
+ "https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/audio/zh-CN/other/zh-CN_other_15.tar": {
86
+ "num_bytes": 299709952,
87
+ "checksum": null
88
+ },
89
+ "https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/audio/zh-CN/invalidated/zh-CN_invalidated_0.tar": {
90
+ "num_bytes": 1000983552,
91
+ "checksum": null
92
+ },
93
+ "https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/audio/zh-CN/invalidated/zh-CN_invalidated_1.tar": {
94
+ "num_bytes": 416471552,
95
+ "checksum": null
96
+ },
97
+ "https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/transcript/zh-CN/train.tsv": {
98
+ "num_bytes": 7373507,
99
+ "checksum": null
100
+ },
101
+ "https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/transcript/zh-CN/dev.tsv": {
102
+ "num_bytes": 2567399,
103
+ "checksum": null
104
+ },
105
+ "https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/transcript/zh-CN/test.tsv": {
106
+ "num_bytes": 2457920,
107
+ "checksum": null
108
+ },
109
+ "https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/transcript/zh-CN/other.tsv": {
110
+ "num_bytes": 137605043,
111
+ "checksum": null
112
+ },
113
+ "https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/transcript/zh-CN/invalidated.tsv": {
114
+ "num_bytes": 13622503,
115
+ "checksum": null
116
+ }
117
+ },
118
+ "download_size": 20414898643,
119
+ "features": {
120
+ "context": {
121
+ "sampling_rate": 16000,
122
+ "_type": "Audio"
123
+ },
124
+ "instruction": {
125
+ "dtype": "string",
126
+ "_type": "Value"
127
+ },
128
+ "answer": {
129
+ "dtype": "string",
130
+ "_type": "Value"
131
+ },
132
+ "audio_length": {
133
+ "dtype": "float64",
134
+ "_type": "Value"
135
+ },
136
+ "language": {
137
+ "dtype": "string",
138
+ "_type": "Value"
139
+ }
140
+ },
141
+ "homepage": "https://commonvoice.mozilla.org/en/datasets",
142
+ "license": "https://creativecommons.org/publicdomain/zero/1.0/",
143
+ "size_in_bytes": 20838882370,
144
+ "splits": {
145
+ "train": {
146
+ "name": "train",
147
+ "num_bytes": 17963235,
148
+ "num_examples": 29406,
149
+ "dataset_name": "common_voice_16_0"
150
+ },
151
+ "validation": {
152
+ "name": "validation",
153
+ "num_bytes": 6351483,
154
+ "num_examples": 10626,
155
+ "dataset_name": "common_voice_16_0"
156
+ },
157
+ "test": {
158
+ "name": "test",
159
+ "num_bytes": 6263265,
160
+ "num_examples": 10626,
161
+ "dataset_name": "common_voice_16_0"
162
+ },
163
+ "other": {
164
+ "name": "other",
165
+ "num_bytes": 358056452,
166
+ "num_examples": 610981,
167
+ "dataset_name": "common_voice_16_0"
168
+ },
169
+ "invalidated": {
170
+ "name": "invalidated",
171
+ "num_bytes": 35349292,
172
+ "num_examples": 58386,
173
+ "dataset_name": "common_voice_16_0"
174
+ }
175
+ },
176
+ "version": {
177
+ "version_str": "15.0.0",
178
+ "major": 15,
179
+ "minor": 0,
180
+ "patch": 0
181
+ }
182
+ }
examples/commonvoice_zh_asr/state.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_data_files": [
3
+ {
4
+ "filename": "data-00000-of-00001.arrow"
5
+ }
6
+ ],
7
+ "_fingerprint": "41452271d4051e81",
8
+ "_format_columns": null,
9
+ "_format_kwargs": {},
10
+ "_format_type": null,
11
+ "_output_all_columns": false,
12
+ "_split": null
13
+ }
examples/covost2_en_id_test/data-00000-of-00001.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d4bfb1098a59bf75aab6b9b824141808bb48160787b182b03fabf4a56527a9e
3
+ size 56496
examples/covost2_en_id_test/dataset_info.json ADDED
@@ -0,0 +1,73 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "builder_name": "parquet",
3
+ "citation": "",
4
+ "config_name": "default",
5
+ "dataset_name": "covost2_en_id_test_v1",
6
+ "dataset_size": 2842304040,
7
+ "description": "",
8
+ "download_checksums": {
9
+ "hf://datasets/AudioLLMs/covost2_en_id_test_v1@51a4b1517f07e1dcf9180aa270f264961165cab3/data/test-00000-of-00006.parquet": {
10
+ "num_bytes": 421383822,
11
+ "checksum": null
12
+ },
13
+ "hf://datasets/AudioLLMs/covost2_en_id_test_v1@51a4b1517f07e1dcf9180aa270f264961165cab3/data/test-00001-of-00006.parquet": {
14
+ "num_bytes": 430366828,
15
+ "checksum": null
16
+ },
17
+ "hf://datasets/AudioLLMs/covost2_en_id_test_v1@51a4b1517f07e1dcf9180aa270f264961165cab3/data/test-00002-of-00006.parquet": {
18
+ "num_bytes": 423203231,
19
+ "checksum": null
20
+ },
21
+ "hf://datasets/AudioLLMs/covost2_en_id_test_v1@51a4b1517f07e1dcf9180aa270f264961165cab3/data/test-00003-of-00006.parquet": {
22
+ "num_bytes": 420946330,
23
+ "checksum": null
24
+ },
25
+ "hf://datasets/AudioLLMs/covost2_en_id_test_v1@51a4b1517f07e1dcf9180aa270f264961165cab3/data/test-00004-of-00006.parquet": {
26
+ "num_bytes": 419734090,
27
+ "checksum": null
28
+ },
29
+ "hf://datasets/AudioLLMs/covost2_en_id_test_v1@51a4b1517f07e1dcf9180aa270f264961165cab3/data/test-00005-of-00006.parquet": {
30
+ "num_bytes": 419963769,
31
+ "checksum": null
32
+ }
33
+ },
34
+ "download_size": 2535598070,
35
+ "features": {
36
+ "context": {
37
+ "_type": "Audio"
38
+ },
39
+ "instruction": {
40
+ "dtype": "string",
41
+ "_type": "Value"
42
+ },
43
+ "answer": {
44
+ "dtype": "string",
45
+ "_type": "Value"
46
+ }
47
+ },
48
+ "homepage": "",
49
+ "license": "",
50
+ "size_in_bytes": 5377902110,
51
+ "splits": {
52
+ "test": {
53
+ "name": "test",
54
+ "num_bytes": 2842304040,
55
+ "num_examples": 15531,
56
+ "shard_lengths": [
57
+ 2789,
58
+ 2789,
59
+ 2789,
60
+ 2788,
61
+ 2788,
62
+ 1588
63
+ ],
64
+ "dataset_name": "covost2_en_id_test_v1"
65
+ }
66
+ },
67
+ "version": {
68
+ "version_str": "0.0.0",
69
+ "major": 0,
70
+ "minor": 0,
71
+ "patch": 0
72
+ }
73
+ }
examples/covost2_en_id_test/state.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_data_files": [
3
+ {
4
+ "filename": "data-00000-of-00001.arrow"
5
+ }
6
+ ],
7
+ "_fingerprint": "f755c8fc2cb9504a",
8
+ "_format_columns": null,
9
+ "_format_kwargs": {},
10
+ "_format_type": null,
11
+ "_output_all_columns": false,
12
+ "_split": null
13
+ }
examples/covost2_en_ta_test/data-00000-of-00001.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89aa8cee7fa6754a1491ca48e31162126a808e07bca8731ecf2949bc183dd20f
3
+ size 58088
examples/covost2_en_ta_test/dataset_info.json ADDED
@@ -0,0 +1,73 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "builder_name": "parquet",
3
+ "citation": "",
4
+ "config_name": "default",
5
+ "dataset_name": "covost2_en_ta_test_v1",
6
+ "dataset_size": 2844002846,
7
+ "description": "",
8
+ "download_checksums": {
9
+ "hf://datasets/AudioLLMs/covost2_en_ta_test_v1@23c23a71d698faf6c940e18753ade03acbcef86b/data/test-00000-of-00006.parquet": {
10
+ "num_bytes": 421472102,
11
+ "checksum": null
12
+ },
13
+ "hf://datasets/AudioLLMs/covost2_en_ta_test_v1@23c23a71d698faf6c940e18753ade03acbcef86b/data/test-00001-of-00006.parquet": {
14
+ "num_bytes": 430453377,
15
+ "checksum": null
16
+ },
17
+ "hf://datasets/AudioLLMs/covost2_en_ta_test_v1@23c23a71d698faf6c940e18753ade03acbcef86b/data/test-00002-of-00006.parquet": {
18
+ "num_bytes": 423289725,
19
+ "checksum": null
20
+ },
21
+ "hf://datasets/AudioLLMs/covost2_en_ta_test_v1@23c23a71d698faf6c940e18753ade03acbcef86b/data/test-00003-of-00006.parquet": {
22
+ "num_bytes": 421032929,
23
+ "checksum": null
24
+ },
25
+ "hf://datasets/AudioLLMs/covost2_en_ta_test_v1@23c23a71d698faf6c940e18753ade03acbcef86b/data/test-00004-of-00006.parquet": {
26
+ "num_bytes": 419820665,
27
+ "checksum": null
28
+ },
29
+ "hf://datasets/AudioLLMs/covost2_en_ta_test_v1@23c23a71d698faf6c940e18753ade03acbcef86b/data/test-00005-of-00006.parquet": {
30
+ "num_bytes": 420052504,
31
+ "checksum": null
32
+ }
33
+ },
34
+ "download_size": 2536121302,
35
+ "features": {
36
+ "context": {
37
+ "_type": "Audio"
38
+ },
39
+ "instruction": {
40
+ "dtype": "string",
41
+ "_type": "Value"
42
+ },
43
+ "answer": {
44
+ "dtype": "string",
45
+ "_type": "Value"
46
+ }
47
+ },
48
+ "homepage": "",
49
+ "license": "",
50
+ "size_in_bytes": 5380124148,
51
+ "splits": {
52
+ "test": {
53
+ "name": "test",
54
+ "num_bytes": 2844002846,
55
+ "num_examples": 15531,
56
+ "shard_lengths": [
57
+ 2789,
58
+ 2789,
59
+ 2789,
60
+ 2788,
61
+ 2788,
62
+ 1588
63
+ ],
64
+ "dataset_name": "covost2_en_ta_test_v1"
65
+ }
66
+ },
67
+ "version": {
68
+ "version_str": "0.0.0",
69
+ "major": 0,
70
+ "minor": 0,
71
+ "patch": 0
72
+ }
73
+ }
examples/covost2_en_ta_test/state.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_data_files": [
3
+ {
4
+ "filename": "data-00000-of-00001.arrow"
5
+ }
6
+ ],
7
+ "_fingerprint": "fe170901fd58bb52",
8
+ "_format_columns": null,
9
+ "_format_kwargs": {},
10
+ "_format_type": null,
11
+ "_output_all_columns": false,
12
+ "_split": null
13
+ }
examples/covost2_en_zh_test/data-00000-of-00001.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aca2fa905173efcf428fd779b4e74ff132b8bab979f925e75ad7ff8b9b19aaa8
3
+ size 40016
examples/covost2_en_zh_test/dataset_info.json ADDED
@@ -0,0 +1,73 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "builder_name": "parquet",
3
+ "citation": "",
4
+ "config_name": "default",
5
+ "dataset_name": "covost2_en_zh_test_v1",
6
+ "dataset_size": 2842110316,
7
+ "description": "",
8
+ "download_checksums": {
9
+ "hf://datasets/AudioLLMs/covost2_en_zh_test_v1@6fe92d7fabaee215b078b022abbe8959280f3187/data/test-00000-of-00006.parquet": {
10
+ "num_bytes": 421376507,
11
+ "checksum": null
12
+ },
13
+ "hf://datasets/AudioLLMs/covost2_en_zh_test_v1@6fe92d7fabaee215b078b022abbe8959280f3187/data/test-00001-of-00006.parquet": {
14
+ "num_bytes": 430362096,
15
+ "checksum": null
16
+ },
17
+ "hf://datasets/AudioLLMs/covost2_en_zh_test_v1@6fe92d7fabaee215b078b022abbe8959280f3187/data/test-00002-of-00006.parquet": {
18
+ "num_bytes": 423196814,
19
+ "checksum": null
20
+ },
21
+ "hf://datasets/AudioLLMs/covost2_en_zh_test_v1@6fe92d7fabaee215b078b022abbe8959280f3187/data/test-00003-of-00006.parquet": {
22
+ "num_bytes": 420938958,
23
+ "checksum": null
24
+ },
25
+ "hf://datasets/AudioLLMs/covost2_en_zh_test_v1@6fe92d7fabaee215b078b022abbe8959280f3187/data/test-00004-of-00006.parquet": {
26
+ "num_bytes": 419730286,
27
+ "checksum": null
28
+ },
29
+ "hf://datasets/AudioLLMs/covost2_en_zh_test_v1@6fe92d7fabaee215b078b022abbe8959280f3187/data/test-00005-of-00006.parquet": {
30
+ "num_bytes": 419958145,
31
+ "checksum": null
32
+ }
33
+ },
34
+ "download_size": 2535562806,
35
+ "features": {
36
+ "context": {
37
+ "_type": "Audio"
38
+ },
39
+ "instruction": {
40
+ "dtype": "string",
41
+ "_type": "Value"
42
+ },
43
+ "answer": {
44
+ "dtype": "string",
45
+ "_type": "Value"
46
+ }
47
+ },
48
+ "homepage": "",
49
+ "license": "",
50
+ "size_in_bytes": 5377673122,
51
+ "splits": {
52
+ "test": {
53
+ "name": "test",
54
+ "num_bytes": 2842110316,
55
+ "num_examples": 15531,
56
+ "shard_lengths": [
57
+ 2789,
58
+ 2789,
59
+ 2789,
60
+ 2788,
61
+ 2788,
62
+ 1588
63
+ ],
64
+ "dataset_name": "covost2_en_zh_test_v1"
65
+ }
66
+ },
67
+ "version": {
68
+ "version_str": "0.0.0",
69
+ "major": 0,
70
+ "minor": 0,
71
+ "patch": 0
72
+ }
73
+ }
examples/covost2_en_zh_test/state.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_data_files": [
3
+ {
4
+ "filename": "data-00000-of-00001.arrow"
5
+ }
6
+ ],
7
+ "_fingerprint": "7445fef56d00d00b",
8
+ "_format_columns": null,
9
+ "_format_kwargs": {},
10
+ "_format_type": null,
11
+ "_output_all_columns": false,
12
+ "_split": null
13
+ }
examples/covost2_id_en_test/data-00000-of-00001.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:573589410f93a7667f83d37bd30b472069e7446d2d5e05aa98fc4138b0fd316b
3
+ size 50736
examples/covost2_id_en_test/dataset_info.json ADDED
@@ -0,0 +1,45 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "builder_name": "parquet",
3
+ "citation": "",
4
+ "config_name": "default",
5
+ "dataset_name": "covost2_id_en_test_v1",
6
+ "dataset_size": 105217105,
7
+ "description": "",
8
+ "download_checksums": {
9
+ "hf://datasets/AudioLLMs/covost2_id_en_test_v1@3998e50bec6eefdae5b38278238c359acb583f4c/data/test-00000-of-00001.parquet": {
10
+ "num_bytes": 100225392,
11
+ "checksum": null
12
+ }
13
+ },
14
+ "download_size": 100225392,
15
+ "features": {
16
+ "context": {
17
+ "_type": "Audio"
18
+ },
19
+ "instruction": {
20
+ "dtype": "string",
21
+ "_type": "Value"
22
+ },
23
+ "answer": {
24
+ "dtype": "string",
25
+ "_type": "Value"
26
+ }
27
+ },
28
+ "homepage": "",
29
+ "license": "",
30
+ "size_in_bytes": 205442497,
31
+ "splits": {
32
+ "test": {
33
+ "name": "test",
34
+ "num_bytes": 105217105,
35
+ "num_examples": 844,
36
+ "dataset_name": "covost2_id_en_test_v1"
37
+ }
38
+ },
39
+ "version": {
40
+ "version_str": "0.0.0",
41
+ "major": 0,
42
+ "minor": 0,
43
+ "patch": 0
44
+ }
45
+ }