Upload folder using huggingface_hub
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- examples/aishell_asr_zh_test/data-00000-of-00001.arrow +3 -0
- examples/aishell_asr_zh_test/dataset_info.json +58 -0
- examples/aishell_asr_zh_test/state.json +13 -0
- examples/alpaca_audio_test/data-00000-of-00001.arrow +3 -0
- examples/alpaca_audio_test/dataset_info.json +49 -0
- examples/alpaca_audio_test/state.json +13 -0
- examples/audiocaps_qa_test/data-00000-of-00001.arrow +3 -0
- examples/audiocaps_qa_test/dataset_info.json +45 -0
- examples/audiocaps_qa_test/state.json +13 -0
- examples/audiocaps_test/data-00000-of-00001.arrow +3 -0
- examples/audiocaps_test/dataset_info.json +58 -0
- examples/audiocaps_test/state.json +13 -0
- examples/clotho_aqa_test/data-00000-of-00001.arrow +3 -0
- examples/clotho_aqa_test/dataset_info.json +58 -0
- examples/clotho_aqa_test/state.json +13 -0
- examples/cn_college_listen_mcq_test/data-00000-of-00001.arrow +3 -0
- examples/cn_college_listen_mcq_test/dataset_info.json +66 -0
- examples/cn_college_listen_mcq_test/state.json +13 -0
- examples/cna_test/data-00000-of-00001.arrow +3 -0
- examples/cna_test/dataset_info.json +20 -0
- examples/cna_test/state.json +13 -0
- examples/common_voice_15_en_test/data-00000-of-00001.arrow +3 -0
- examples/common_voice_15_en_test/dataset_info.json +28 -0
- examples/common_voice_15_en_test/state.json +19 -0
- examples/commonvoice_17_id_asr/data-00000-of-00001.arrow +3 -0
- examples/commonvoice_17_id_asr/dataset_info.json +132 -0
- examples/commonvoice_17_id_asr/state.json +13 -0
- examples/commonvoice_17_ta_asr/data-00000-of-00001.arrow +3 -0
- examples/commonvoice_17_ta_asr/dataset_info.json +156 -0
- examples/commonvoice_17_ta_asr/state.json +13 -0
- examples/commonvoice_17_th_asr/data-00000-of-00001.arrow +3 -0
- examples/commonvoice_17_th_asr/dataset_info.json +164 -0
- examples/commonvoice_17_th_asr/state.json +13 -0
- examples/commonvoice_17_vi_asr/data-00000-of-00001.arrow +3 -0
- examples/commonvoice_17_vi_asr/dataset_info.json +132 -0
- examples/commonvoice_17_vi_asr/state.json +13 -0
- examples/commonvoice_zh_asr/data-00000-of-00001.arrow +3 -0
- examples/commonvoice_zh_asr/dataset_info.json +182 -0
- examples/commonvoice_zh_asr/state.json +13 -0
- examples/covost2_en_id_test/data-00000-of-00001.arrow +3 -0
- examples/covost2_en_id_test/dataset_info.json +73 -0
- examples/covost2_en_id_test/state.json +13 -0
- examples/covost2_en_ta_test/data-00000-of-00001.arrow +3 -0
- examples/covost2_en_ta_test/dataset_info.json +73 -0
- examples/covost2_en_ta_test/state.json +13 -0
- examples/covost2_en_zh_test/data-00000-of-00001.arrow +3 -0
- examples/covost2_en_zh_test/dataset_info.json +73 -0
- examples/covost2_en_zh_test/state.json +13 -0
- examples/covost2_id_en_test/data-00000-of-00001.arrow +3 -0
- examples/covost2_id_en_test/dataset_info.json +45 -0
examples/aishell_asr_zh_test/data-00000-of-00001.arrow
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8d8ed27441c9a5f6ac8b38e27b52ce555fe03322530ff16c16f2796c9f6e7f45
|
3 |
+
size 44296
|
examples/aishell_asr_zh_test/dataset_info.json
ADDED
@@ -0,0 +1,58 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"builder_name": "parquet",
|
3 |
+
"citation": "",
|
4 |
+
"config_name": "default",
|
5 |
+
"dataset_name": "aishell_asr_zh_test_v1",
|
6 |
+
"dataset_size": 1115469955,
|
7 |
+
"description": "",
|
8 |
+
"download_checksums": {
|
9 |
+
"hf://datasets/AudioLLMs/aishell_asr_zh_test_v1@e73dc7f096ecea5c8e5c722446c8d3b4014fdd18/data/test-00000-of-00003.parquet": {
|
10 |
+
"num_bytes": 364047728,
|
11 |
+
"checksum": null
|
12 |
+
},
|
13 |
+
"hf://datasets/AudioLLMs/aishell_asr_zh_test_v1@e73dc7f096ecea5c8e5c722446c8d3b4014fdd18/data/test-00001-of-00003.parquet": {
|
14 |
+
"num_bytes": 354834886,
|
15 |
+
"checksum": null
|
16 |
+
},
|
17 |
+
"hf://datasets/AudioLLMs/aishell_asr_zh_test_v1@e73dc7f096ecea5c8e5c722446c8d3b4014fdd18/data/test-00002-of-00003.parquet": {
|
18 |
+
"num_bytes": 377041689,
|
19 |
+
"checksum": null
|
20 |
+
}
|
21 |
+
},
|
22 |
+
"download_size": 1095924303,
|
23 |
+
"features": {
|
24 |
+
"context": {
|
25 |
+
"_type": "Audio"
|
26 |
+
},
|
27 |
+
"instruction": {
|
28 |
+
"dtype": "string",
|
29 |
+
"_type": "Value"
|
30 |
+
},
|
31 |
+
"answer": {
|
32 |
+
"dtype": "string",
|
33 |
+
"_type": "Value"
|
34 |
+
}
|
35 |
+
},
|
36 |
+
"homepage": "",
|
37 |
+
"license": "",
|
38 |
+
"size_in_bytes": 2211394258,
|
39 |
+
"splits": {
|
40 |
+
"test": {
|
41 |
+
"name": "test",
|
42 |
+
"num_bytes": 1115469955,
|
43 |
+
"num_examples": 6920,
|
44 |
+
"shard_lengths": [
|
45 |
+
3207,
|
46 |
+
3107,
|
47 |
+
606
|
48 |
+
],
|
49 |
+
"dataset_name": "aishell_asr_zh_test_v1"
|
50 |
+
}
|
51 |
+
},
|
52 |
+
"version": {
|
53 |
+
"version_str": "0.0.0",
|
54 |
+
"major": 0,
|
55 |
+
"minor": 0,
|
56 |
+
"patch": 0
|
57 |
+
}
|
58 |
+
}
|
examples/aishell_asr_zh_test/state.json
ADDED
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_data_files": [
|
3 |
+
{
|
4 |
+
"filename": "data-00000-of-00001.arrow"
|
5 |
+
}
|
6 |
+
],
|
7 |
+
"_fingerprint": "5a1f0f8b9b3ca365",
|
8 |
+
"_format_columns": null,
|
9 |
+
"_format_kwargs": {},
|
10 |
+
"_format_type": null,
|
11 |
+
"_output_all_columns": false,
|
12 |
+
"_split": null
|
13 |
+
}
|
examples/alpaca_audio_test/data-00000-of-00001.arrow
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:acbe0fbf69f6732a358e6c6575354464b9c5e39b87be73cc9f1ae7c284e9e575
|
3 |
+
size 44600
|
examples/alpaca_audio_test/dataset_info.json
ADDED
@@ -0,0 +1,49 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"builder_name": "parquet",
|
3 |
+
"citation": "",
|
4 |
+
"config_name": "default",
|
5 |
+
"dataset_name": "alpaca_audio_test",
|
6 |
+
"dataset_size": 13865321,
|
7 |
+
"description": "",
|
8 |
+
"download_checksums": {
|
9 |
+
"hf://datasets/AudioLLMs/alpaca_audio_test@7eb2ab279975033690d67bee66e45eb612a430ee/data/test-00000-of-00001.parquet": {
|
10 |
+
"num_bytes": 12245608,
|
11 |
+
"checksum": null
|
12 |
+
}
|
13 |
+
},
|
14 |
+
"download_size": 12245608,
|
15 |
+
"features": {
|
16 |
+
"context": {
|
17 |
+
"_type": "Audio"
|
18 |
+
},
|
19 |
+
"instruction": {
|
20 |
+
"dtype": "string",
|
21 |
+
"_type": "Value"
|
22 |
+
},
|
23 |
+
"speech_instruction": {
|
24 |
+
"dtype": "string",
|
25 |
+
"_type": "Value"
|
26 |
+
},
|
27 |
+
"answer": {
|
28 |
+
"dtype": "string",
|
29 |
+
"_type": "Value"
|
30 |
+
}
|
31 |
+
},
|
32 |
+
"homepage": "",
|
33 |
+
"license": "",
|
34 |
+
"size_in_bytes": 26110929,
|
35 |
+
"splits": {
|
36 |
+
"test": {
|
37 |
+
"name": "test",
|
38 |
+
"num_bytes": 13865321,
|
39 |
+
"num_examples": 100,
|
40 |
+
"dataset_name": "alpaca_audio_test"
|
41 |
+
}
|
42 |
+
},
|
43 |
+
"version": {
|
44 |
+
"version_str": "0.0.0",
|
45 |
+
"major": 0,
|
46 |
+
"minor": 0,
|
47 |
+
"patch": 0
|
48 |
+
}
|
49 |
+
}
|
examples/alpaca_audio_test/state.json
ADDED
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_data_files": [
|
3 |
+
{
|
4 |
+
"filename": "data-00000-of-00001.arrow"
|
5 |
+
}
|
6 |
+
],
|
7 |
+
"_fingerprint": "a7169220e58f4523",
|
8 |
+
"_format_columns": null,
|
9 |
+
"_format_kwargs": {},
|
10 |
+
"_format_type": null,
|
11 |
+
"_output_all_columns": false,
|
12 |
+
"_split": null
|
13 |
+
}
|
examples/audiocaps_qa_test/data-00000-of-00001.arrow
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cc4745b0e32ece9d9f32f5a5a689eb5e24ca6755f114cd2b1f1f445819fa1375
|
3 |
+
size 103208
|
examples/audiocaps_qa_test/dataset_info.json
ADDED
@@ -0,0 +1,45 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"builder_name": "parquet",
|
3 |
+
"citation": "",
|
4 |
+
"config_name": "default",
|
5 |
+
"dataset_name": "audiocaps_qa_test_v3",
|
6 |
+
"dataset_size": 98835422,
|
7 |
+
"description": "",
|
8 |
+
"download_checksums": {
|
9 |
+
"hf://datasets/AudioLLMs/audiocaps_qa_test_v3@6cf6853c52f55482126f226a8859eb71f2021e0e/data/test-00000-of-00001.parquet": {
|
10 |
+
"num_bytes": 92241687,
|
11 |
+
"checksum": null
|
12 |
+
}
|
13 |
+
},
|
14 |
+
"download_size": 92241687,
|
15 |
+
"features": {
|
16 |
+
"context": {
|
17 |
+
"_type": "Audio"
|
18 |
+
},
|
19 |
+
"instruction": {
|
20 |
+
"dtype": "string",
|
21 |
+
"_type": "Value"
|
22 |
+
},
|
23 |
+
"answer": {
|
24 |
+
"dtype": "string",
|
25 |
+
"_type": "Value"
|
26 |
+
}
|
27 |
+
},
|
28 |
+
"homepage": "",
|
29 |
+
"license": "",
|
30 |
+
"size_in_bytes": 191077109,
|
31 |
+
"splits": {
|
32 |
+
"test": {
|
33 |
+
"name": "test",
|
34 |
+
"num_bytes": 98835422,
|
35 |
+
"num_examples": 313,
|
36 |
+
"dataset_name": "audiocaps_qa_test_v3"
|
37 |
+
}
|
38 |
+
},
|
39 |
+
"version": {
|
40 |
+
"version_str": "0.0.0",
|
41 |
+
"major": 0,
|
42 |
+
"minor": 0,
|
43 |
+
"patch": 0
|
44 |
+
}
|
45 |
+
}
|
examples/audiocaps_qa_test/state.json
ADDED
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_data_files": [
|
3 |
+
{
|
4 |
+
"filename": "data-00000-of-00001.arrow"
|
5 |
+
}
|
6 |
+
],
|
7 |
+
"_fingerprint": "748c6693112f77f2",
|
8 |
+
"_format_columns": null,
|
9 |
+
"_format_kwargs": {},
|
10 |
+
"_format_type": null,
|
11 |
+
"_output_all_columns": false,
|
12 |
+
"_split": null
|
13 |
+
}
|
examples/audiocaps_test/data-00000-of-00001.arrow
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9cfff9093667c39e6750f23693d4d817193a0fbb829e3c6155d4a4c44462a184
|
3 |
+
size 107320
|
examples/audiocaps_test/dataset_info.json
ADDED
@@ -0,0 +1,58 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"builder_name": "parquet",
|
3 |
+
"citation": "",
|
4 |
+
"config_name": "default",
|
5 |
+
"dataset_name": "audiocaps_test",
|
6 |
+
"dataset_size": 1389113784,
|
7 |
+
"description": "",
|
8 |
+
"download_checksums": {
|
9 |
+
"hf://datasets/AudioLLMs/audiocaps_test@fb42aac15212cbddd723fbbf04b6071b60a9f8fe/data/test-00000-of-00003.parquet": {
|
10 |
+
"num_bytes": 432299885,
|
11 |
+
"checksum": null
|
12 |
+
},
|
13 |
+
"hf://datasets/AudioLLMs/audiocaps_test@fb42aac15212cbddd723fbbf04b6071b60a9f8fe/data/test-00001-of-00003.parquet": {
|
14 |
+
"num_bytes": 435786346,
|
15 |
+
"checksum": null
|
16 |
+
},
|
17 |
+
"hf://datasets/AudioLLMs/audiocaps_test@fb42aac15212cbddd723fbbf04b6071b60a9f8fe/data/test-00002-of-00003.parquet": {
|
18 |
+
"num_bytes": 435930887,
|
19 |
+
"checksum": null
|
20 |
+
}
|
21 |
+
},
|
22 |
+
"download_size": 1304017118,
|
23 |
+
"features": {
|
24 |
+
"context": {
|
25 |
+
"_type": "Audio"
|
26 |
+
},
|
27 |
+
"instruction": {
|
28 |
+
"dtype": "string",
|
29 |
+
"_type": "Value"
|
30 |
+
},
|
31 |
+
"answer": {
|
32 |
+
"dtype": "string",
|
33 |
+
"_type": "Value"
|
34 |
+
}
|
35 |
+
},
|
36 |
+
"homepage": "",
|
37 |
+
"license": "",
|
38 |
+
"size_in_bytes": 2693130902,
|
39 |
+
"splits": {
|
40 |
+
"test": {
|
41 |
+
"name": "test",
|
42 |
+
"num_bytes": 1389113784,
|
43 |
+
"num_examples": 4400,
|
44 |
+
"shard_lengths": [
|
45 |
+
1667,
|
46 |
+
1667,
|
47 |
+
1066
|
48 |
+
],
|
49 |
+
"dataset_name": "audiocaps_test"
|
50 |
+
}
|
51 |
+
},
|
52 |
+
"version": {
|
53 |
+
"version_str": "0.0.0",
|
54 |
+
"major": 0,
|
55 |
+
"minor": 0,
|
56 |
+
"patch": 0
|
57 |
+
}
|
58 |
+
}
|
examples/audiocaps_test/state.json
ADDED
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_data_files": [
|
3 |
+
{
|
4 |
+
"filename": "data-00000-of-00001.arrow"
|
5 |
+
}
|
6 |
+
],
|
7 |
+
"_fingerprint": "1872292586a4b460",
|
8 |
+
"_format_columns": null,
|
9 |
+
"_format_kwargs": {},
|
10 |
+
"_format_type": null,
|
11 |
+
"_output_all_columns": false,
|
12 |
+
"_split": null
|
13 |
+
}
|
examples/clotho_aqa_test/data-00000-of-00001.arrow
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8ad7fcb1e24f43a32efd32f08888b84f2ff5ebd275e43ca26e6230c7d01922cf
|
3 |
+
size 194400
|
examples/clotho_aqa_test/dataset_info.json
ADDED
@@ -0,0 +1,58 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"builder_name": "parquet",
|
3 |
+
"citation": "",
|
4 |
+
"config_name": "default",
|
5 |
+
"dataset_name": "clotho_asqa_test_v2",
|
6 |
+
"dataset_size": 1485321871,
|
7 |
+
"description": "",
|
8 |
+
"download_checksums": {
|
9 |
+
"hf://datasets/AudioLLMs/clotho_asqa_test_v2@a7f4a7983d490e87a79eb041fede83e418c0ea4f/data/test-00000-of-00003.parquet": {
|
10 |
+
"num_bytes": 118559858,
|
11 |
+
"checksum": null
|
12 |
+
},
|
13 |
+
"hf://datasets/AudioLLMs/clotho_asqa_test_v2@a7f4a7983d490e87a79eb041fede83e418c0ea4f/data/test-00001-of-00003.parquet": {
|
14 |
+
"num_bytes": 116519615,
|
15 |
+
"checksum": null
|
16 |
+
},
|
17 |
+
"hf://datasets/AudioLLMs/clotho_asqa_test_v2@a7f4a7983d490e87a79eb041fede83e418c0ea4f/data/test-00002-of-00003.parquet": {
|
18 |
+
"num_bytes": 113032047,
|
19 |
+
"checksum": null
|
20 |
+
}
|
21 |
+
},
|
22 |
+
"download_size": 348111520,
|
23 |
+
"features": {
|
24 |
+
"context": {
|
25 |
+
"_type": "Audio"
|
26 |
+
},
|
27 |
+
"instruction": {
|
28 |
+
"dtype": "string",
|
29 |
+
"_type": "Value"
|
30 |
+
},
|
31 |
+
"answer": {
|
32 |
+
"dtype": "string",
|
33 |
+
"_type": "Value"
|
34 |
+
}
|
35 |
+
},
|
36 |
+
"homepage": "",
|
37 |
+
"license": "",
|
38 |
+
"size_in_bytes": 1833433391,
|
39 |
+
"splits": {
|
40 |
+
"test": {
|
41 |
+
"name": "test",
|
42 |
+
"num_bytes": 1485321871,
|
43 |
+
"num_examples": 2057,
|
44 |
+
"shard_lengths": [
|
45 |
+
786,
|
46 |
+
786,
|
47 |
+
485
|
48 |
+
],
|
49 |
+
"dataset_name": "clotho_asqa_test_v2"
|
50 |
+
}
|
51 |
+
},
|
52 |
+
"version": {
|
53 |
+
"version_str": "0.0.0",
|
54 |
+
"major": 0,
|
55 |
+
"minor": 0,
|
56 |
+
"patch": 0
|
57 |
+
}
|
58 |
+
}
|
examples/clotho_aqa_test/state.json
ADDED
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_data_files": [
|
3 |
+
{
|
4 |
+
"filename": "data-00000-of-00001.arrow"
|
5 |
+
}
|
6 |
+
],
|
7 |
+
"_fingerprint": "35d1627b19106626",
|
8 |
+
"_format_columns": null,
|
9 |
+
"_format_kwargs": {},
|
10 |
+
"_format_type": null,
|
11 |
+
"_output_all_columns": false,
|
12 |
+
"_split": null
|
13 |
+
}
|
examples/cn_college_listen_mcq_test/data-00000-of-00001.arrow
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3131dbbd9306a9622d446f8f151f1db0dd7ba3a14bd82f711126d159a813d5d5
|
3 |
+
size 152776
|
examples/cn_college_listen_mcq_test/dataset_info.json
ADDED
@@ -0,0 +1,66 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"builder_name": "parquet",
|
3 |
+
"citation": "",
|
4 |
+
"config_name": "default",
|
5 |
+
"dataset_name": "cn_college_listen_mcq_test",
|
6 |
+
"dataset_size": 1532841284,
|
7 |
+
"description": "",
|
8 |
+
"download_checksums": {
|
9 |
+
"hf://datasets/AudioLLMs/cn_college_listen_mcq_test@708d8ef278b5eadae714c314889f5d81ded18a25/data/test-00000-of-00004.parquet": {
|
10 |
+
"num_bytes": 283046288,
|
11 |
+
"checksum": null
|
12 |
+
},
|
13 |
+
"hf://datasets/AudioLLMs/cn_college_listen_mcq_test@708d8ef278b5eadae714c314889f5d81ded18a25/data/test-00001-of-00004.parquet": {
|
14 |
+
"num_bytes": 241939389,
|
15 |
+
"checksum": null
|
16 |
+
},
|
17 |
+
"hf://datasets/AudioLLMs/cn_college_listen_mcq_test@708d8ef278b5eadae714c314889f5d81ded18a25/data/test-00002-of-00004.parquet": {
|
18 |
+
"num_bytes": 248376444,
|
19 |
+
"checksum": null
|
20 |
+
},
|
21 |
+
"hf://datasets/AudioLLMs/cn_college_listen_mcq_test@708d8ef278b5eadae714c314889f5d81ded18a25/data/test-00003-of-00004.parquet": {
|
22 |
+
"num_bytes": 256294919,
|
23 |
+
"checksum": null
|
24 |
+
}
|
25 |
+
},
|
26 |
+
"download_size": 1029657040,
|
27 |
+
"features": {
|
28 |
+
"context": {
|
29 |
+
"_type": "Audio"
|
30 |
+
},
|
31 |
+
"instruction": {
|
32 |
+
"dtype": "string",
|
33 |
+
"_type": "Value"
|
34 |
+
},
|
35 |
+
"choices": {
|
36 |
+
"dtype": "string",
|
37 |
+
"_type": "Value"
|
38 |
+
},
|
39 |
+
"answer": {
|
40 |
+
"dtype": "string",
|
41 |
+
"_type": "Value"
|
42 |
+
}
|
43 |
+
},
|
44 |
+
"homepage": "",
|
45 |
+
"license": "",
|
46 |
+
"size_in_bytes": 2562498324,
|
47 |
+
"splits": {
|
48 |
+
"test": {
|
49 |
+
"name": "test",
|
50 |
+
"num_bytes": 1532841284,
|
51 |
+
"num_examples": 2271,
|
52 |
+
"shard_lengths": [
|
53 |
+
500,
|
54 |
+
1036,
|
55 |
+
735
|
56 |
+
],
|
57 |
+
"dataset_name": "cn_college_listen_mcq_test"
|
58 |
+
}
|
59 |
+
},
|
60 |
+
"version": {
|
61 |
+
"version_str": "0.0.0",
|
62 |
+
"major": 0,
|
63 |
+
"minor": 0,
|
64 |
+
"patch": 0
|
65 |
+
}
|
66 |
+
}
|
examples/cn_college_listen_mcq_test/state.json
ADDED
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_data_files": [
|
3 |
+
{
|
4 |
+
"filename": "data-00000-of-00001.arrow"
|
5 |
+
}
|
6 |
+
],
|
7 |
+
"_fingerprint": "d42e39c8837074fc",
|
8 |
+
"_format_columns": null,
|
9 |
+
"_format_kwargs": {},
|
10 |
+
"_format_type": null,
|
11 |
+
"_output_all_columns": false,
|
12 |
+
"_split": null
|
13 |
+
}
|
examples/cna_test/data-00000-of-00001.arrow
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d37e6858c1291ebeb2bcb6bfbe8f5291da48f4199a46ae88a60eb57fa135b61f
|
3 |
+
size 34600
|
examples/cna_test/dataset_info.json
ADDED
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"citation": "",
|
3 |
+
"description": "",
|
4 |
+
"features": {
|
5 |
+
"context": {
|
6 |
+
"sampling_rate": 16000,
|
7 |
+
"_type": "Audio"
|
8 |
+
},
|
9 |
+
"instruction": {
|
10 |
+
"dtype": "string",
|
11 |
+
"_type": "Value"
|
12 |
+
},
|
13 |
+
"answer": {
|
14 |
+
"dtype": "string",
|
15 |
+
"_type": "Value"
|
16 |
+
}
|
17 |
+
},
|
18 |
+
"homepage": "",
|
19 |
+
"license": ""
|
20 |
+
}
|
examples/cna_test/state.json
ADDED
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_data_files": [
|
3 |
+
{
|
4 |
+
"filename": "data-00000-of-00001.arrow"
|
5 |
+
}
|
6 |
+
],
|
7 |
+
"_fingerprint": "22ae0abf541af796",
|
8 |
+
"_format_columns": null,
|
9 |
+
"_format_kwargs": {},
|
10 |
+
"_format_type": null,
|
11 |
+
"_output_all_columns": false,
|
12 |
+
"_split": null
|
13 |
+
}
|
examples/common_voice_15_en_test/data-00000-of-00001.arrow
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fd5f49efa47828a4a7b9a6fc584b19562acae2f90451219939b0c11b4d41621f
|
3 |
+
size 54992
|
examples/common_voice_15_en_test/dataset_info.json
ADDED
@@ -0,0 +1,28 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"citation": "",
|
3 |
+
"description": "",
|
4 |
+
"features": {
|
5 |
+
"context": {
|
6 |
+
"sampling_rate": 16000,
|
7 |
+
"_type": "Audio"
|
8 |
+
},
|
9 |
+
"instruction": {
|
10 |
+
"dtype": "string",
|
11 |
+
"_type": "Value"
|
12 |
+
},
|
13 |
+
"answer": {
|
14 |
+
"dtype": "string",
|
15 |
+
"_type": "Value"
|
16 |
+
},
|
17 |
+
"language": {
|
18 |
+
"dtype": "string",
|
19 |
+
"_type": "Value"
|
20 |
+
},
|
21 |
+
"audio_length": {
|
22 |
+
"dtype": "float64",
|
23 |
+
"_type": "Value"
|
24 |
+
}
|
25 |
+
},
|
26 |
+
"homepage": "",
|
27 |
+
"license": ""
|
28 |
+
}
|
examples/common_voice_15_en_test/state.json
ADDED
@@ -0,0 +1,19 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_data_files": [
|
3 |
+
{
|
4 |
+
"filename": "data-00000-of-00001.arrow"
|
5 |
+
}
|
6 |
+
],
|
7 |
+
"_fingerprint": "62012827f888a0f5",
|
8 |
+
"_format_columns": [
|
9 |
+
"answer",
|
10 |
+
"audio_length",
|
11 |
+
"context",
|
12 |
+
"instruction",
|
13 |
+
"language"
|
14 |
+
],
|
15 |
+
"_format_kwargs": {},
|
16 |
+
"_format_type": null,
|
17 |
+
"_output_all_columns": false,
|
18 |
+
"_split": null
|
19 |
+
}
|
examples/commonvoice_17_id_asr/data-00000-of-00001.arrow
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ae05a4b823184603908f2b4149190b4fab9965be5468f6b4fa34e0e214c97760
|
3 |
+
size 43784
|
examples/commonvoice_17_id_asr/dataset_info.json
ADDED
@@ -0,0 +1,132 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"builder_name": "common_voice_17_0",
|
3 |
+
"citation": "@inproceedings{commonvoice:2020,\n author = {Ardila, R. and Branson, M. and Davis, K. and Henretty, M. and Kohler, M. and Meyer, J. and Morais, R. and Saunders, L. and Tyers, F. M. and Weber, G.},\n title = {Common Voice: A Massively-Multilingual Speech Corpus},\n booktitle = {Proceedings of the 12th Conference on Language Resources and Evaluation (LREC 2020)},\n pages = {4211--4215},\n year = 2020\n}\n",
|
4 |
+
"config_name": "id",
|
5 |
+
"dataset_name": "common_voice_17_0",
|
6 |
+
"dataset_size": 42157018,
|
7 |
+
"description": "Common Voice is Mozilla's initiative to help teach machines how real people speak. The dataset currently consists of 20408 validated hours of speech in 124 languages, but more voices and languages are always added.",
|
8 |
+
"download_checksums": {
|
9 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/n_shards.json": {
|
10 |
+
"num_bytes": 17491,
|
11 |
+
"checksum": null
|
12 |
+
},
|
13 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/id/train/id_train_0.tar": {
|
14 |
+
"num_bytes": 170035200,
|
15 |
+
"checksum": null
|
16 |
+
},
|
17 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/id/dev/id_dev_0.tar": {
|
18 |
+
"num_bytes": 102236160,
|
19 |
+
"checksum": null
|
20 |
+
},
|
21 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/id/test/id_test_0.tar": {
|
22 |
+
"num_bytes": 110315520,
|
23 |
+
"checksum": null
|
24 |
+
},
|
25 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/id/other/id_other_0.tar": {
|
26 |
+
"num_bytes": 686858240,
|
27 |
+
"checksum": null
|
28 |
+
},
|
29 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/id/invalidated/id_invalidated_0.tar": {
|
30 |
+
"num_bytes": 68034560,
|
31 |
+
"checksum": null
|
32 |
+
},
|
33 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/id/validated/id_validated_0.tar": {
|
34 |
+
"num_bytes": 805611520,
|
35 |
+
"checksum": null
|
36 |
+
},
|
37 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/id/train.tsv": {
|
38 |
+
"num_bytes": 1571021,
|
39 |
+
"checksum": null
|
40 |
+
},
|
41 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/id/dev.tsv": {
|
42 |
+
"num_bytes": 1016964,
|
43 |
+
"checksum": null
|
44 |
+
},
|
45 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/id/test.tsv": {
|
46 |
+
"num_bytes": 1052525,
|
47 |
+
"checksum": null
|
48 |
+
},
|
49 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/id/other.tsv": {
|
50 |
+
"num_bytes": 8607181,
|
51 |
+
"checksum": null
|
52 |
+
},
|
53 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/id/invalidated.tsv": {
|
54 |
+
"num_bytes": 784798,
|
55 |
+
"checksum": null
|
56 |
+
},
|
57 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/id/validated.tsv": {
|
58 |
+
"num_bytes": 7772548,
|
59 |
+
"checksum": null
|
60 |
+
}
|
61 |
+
},
|
62 |
+
"download_size": 1963913728,
|
63 |
+
"features": {
|
64 |
+
"context": {
|
65 |
+
"sampling_rate": 16000,
|
66 |
+
"_type": "Audio"
|
67 |
+
},
|
68 |
+
"instruction": {
|
69 |
+
"dtype": "string",
|
70 |
+
"_type": "Value"
|
71 |
+
},
|
72 |
+
"answer": {
|
73 |
+
"dtype": "string",
|
74 |
+
"_type": "Value"
|
75 |
+
},
|
76 |
+
"audio_length": {
|
77 |
+
"dtype": "float64",
|
78 |
+
"_type": "Value"
|
79 |
+
},
|
80 |
+
"language": {
|
81 |
+
"dtype": "string",
|
82 |
+
"_type": "Value"
|
83 |
+
}
|
84 |
+
},
|
85 |
+
"homepage": "https://commonvoice.mozilla.org/en/datasets",
|
86 |
+
"license": "https://creativecommons.org/publicdomain/zero/1.0/",
|
87 |
+
"size_in_bytes": 2006070746,
|
88 |
+
"splits": {
|
89 |
+
"train": {
|
90 |
+
"name": "train",
|
91 |
+
"num_bytes": 3067499,
|
92 |
+
"num_examples": 4970,
|
93 |
+
"dataset_name": "common_voice_17_0"
|
94 |
+
},
|
95 |
+
"validation": {
|
96 |
+
"name": "validation",
|
97 |
+
"num_bytes": 2011909,
|
98 |
+
"num_examples": 3349,
|
99 |
+
"dataset_name": "common_voice_17_0"
|
100 |
+
},
|
101 |
+
"test": {
|
102 |
+
"name": "test",
|
103 |
+
"num_bytes": 2141524,
|
104 |
+
"num_examples": 3641,
|
105 |
+
"dataset_name": "common_voice_17_0"
|
106 |
+
},
|
107 |
+
"other": {
|
108 |
+
"name": "other",
|
109 |
+
"num_bytes": 17492664,
|
110 |
+
"num_examples": 29508,
|
111 |
+
"dataset_name": "common_voice_17_0"
|
112 |
+
},
|
113 |
+
"invalidated": {
|
114 |
+
"name": "invalidated",
|
115 |
+
"num_bytes": 1600375,
|
116 |
+
"num_examples": 2605,
|
117 |
+
"dataset_name": "common_voice_17_0"
|
118 |
+
},
|
119 |
+
"validated": {
|
120 |
+
"name": "validated",
|
121 |
+
"num_bytes": 15843047,
|
122 |
+
"num_examples": 26108,
|
123 |
+
"dataset_name": "common_voice_17_0"
|
124 |
+
}
|
125 |
+
},
|
126 |
+
"version": {
|
127 |
+
"version_str": "17.0.0",
|
128 |
+
"major": 17,
|
129 |
+
"minor": 0,
|
130 |
+
"patch": 0
|
131 |
+
}
|
132 |
+
}
|
examples/commonvoice_17_id_asr/state.json
ADDED
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_data_files": [
|
3 |
+
{
|
4 |
+
"filename": "data-00000-of-00001.arrow"
|
5 |
+
}
|
6 |
+
],
|
7 |
+
"_fingerprint": "75931a254b089787",
|
8 |
+
"_format_columns": null,
|
9 |
+
"_format_kwargs": {},
|
10 |
+
"_format_type": null,
|
11 |
+
"_output_all_columns": false,
|
12 |
+
"_split": null
|
13 |
+
}
|
examples/commonvoice_17_ta_asr/data-00000-of-00001.arrow
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:98470c84b50bb5c1b10476e4f6ea518ddd9127b64b0c680302f774af7b538b71
|
3 |
+
size 90616
|
examples/commonvoice_17_ta_asr/dataset_info.json
ADDED
@@ -0,0 +1,156 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"builder_name": "common_voice_17_0",
|
3 |
+
"citation": "@inproceedings{commonvoice:2020,\n author = {Ardila, R. and Branson, M. and Davis, K. and Henretty, M. and Kohler, M. and Meyer, J. and Morais, R. and Saunders, L. and Tyers, F. M. and Weber, G.},\n title = {Common Voice: A Massively-Multilingual Speech Corpus},\n booktitle = {Proceedings of the 12th Conference on Language Resources and Evaluation (LREC 2020)},\n pages = {4211--4215},\n year = 2020\n}\n",
|
4 |
+
"config_name": "ta",
|
5 |
+
"dataset_name": "common_voice_17_0",
|
6 |
+
"dataset_size": 221361139,
|
7 |
+
"description": "Common Voice is Mozilla's initiative to help teach machines how real people speak. The dataset currently consists of 20408 validated hours of speech in 124 languages, but more voices and languages are always added.",
|
8 |
+
"download_checksums": {
|
9 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/n_shards.json": {
|
10 |
+
"num_bytes": 17491,
|
11 |
+
"checksum": null
|
12 |
+
},
|
13 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/ta/train/ta_train_0.tar": {
|
14 |
+
"num_bytes": 1598955520,
|
15 |
+
"checksum": null
|
16 |
+
},
|
17 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/ta/train/ta_train_1.tar": {
|
18 |
+
"num_bytes": 224542720,
|
19 |
+
"checksum": null
|
20 |
+
},
|
21 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/ta/dev/ta_dev_0.tar": {
|
22 |
+
"num_bytes": 434257920,
|
23 |
+
"checksum": null
|
24 |
+
},
|
25 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/ta/test/ta_test_0.tar": {
|
26 |
+
"num_bytes": 454778880,
|
27 |
+
"checksum": null
|
28 |
+
},
|
29 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/ta/other/ta_other_0.tar": {
|
30 |
+
"num_bytes": 1560514560,
|
31 |
+
"checksum": null
|
32 |
+
},
|
33 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/ta/other/ta_other_1.tar": {
|
34 |
+
"num_bytes": 1515827200,
|
35 |
+
"checksum": null
|
36 |
+
},
|
37 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/ta/other/ta_other_2.tar": {
|
38 |
+
"num_bytes": 495831040,
|
39 |
+
"checksum": null
|
40 |
+
},
|
41 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/ta/invalidated/ta_invalidated_0.tar": {
|
42 |
+
"num_bytes": 231424000,
|
43 |
+
"checksum": null
|
44 |
+
},
|
45 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/ta/validated/ta_validated_0.tar": {
|
46 |
+
"num_bytes": 1447434240,
|
47 |
+
"checksum": null
|
48 |
+
},
|
49 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/ta/validated/ta_validated_1.tar": {
|
50 |
+
"num_bytes": 1530644480,
|
51 |
+
"checksum": null
|
52 |
+
},
|
53 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/ta/validated/ta_validated_2.tar": {
|
54 |
+
"num_bytes": 1654978560,
|
55 |
+
"checksum": null
|
56 |
+
},
|
57 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/ta/validated/ta_validated_3.tar": {
|
58 |
+
"num_bytes": 652861440,
|
59 |
+
"checksum": null
|
60 |
+
},
|
61 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/ta/train.tsv": {
|
62 |
+
"num_bytes": 19608830,
|
63 |
+
"checksum": null
|
64 |
+
},
|
65 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/ta/dev.tsv": {
|
66 |
+
"num_bytes": 5203704,
|
67 |
+
"checksum": null
|
68 |
+
},
|
69 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/ta/test.tsv": {
|
70 |
+
"num_bytes": 4944646,
|
71 |
+
"checksum": null
|
72 |
+
},
|
73 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/ta/other.tsv": {
|
74 |
+
"num_bytes": 39470943,
|
75 |
+
"checksum": null
|
76 |
+
},
|
77 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/ta/invalidated.tsv": {
|
78 |
+
"num_bytes": 2499761,
|
79 |
+
"checksum": null
|
80 |
+
},
|
81 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/ta/validated.tsv": {
|
82 |
+
"num_bytes": 56763398,
|
83 |
+
"checksum": null
|
84 |
+
}
|
85 |
+
},
|
86 |
+
"download_size": 11930559333,
|
87 |
+
"features": {
|
88 |
+
"context": {
|
89 |
+
"sampling_rate": 16000,
|
90 |
+
"_type": "Audio"
|
91 |
+
},
|
92 |
+
"instruction": {
|
93 |
+
"dtype": "string",
|
94 |
+
"_type": "Value"
|
95 |
+
},
|
96 |
+
"answer": {
|
97 |
+
"dtype": "string",
|
98 |
+
"_type": "Value"
|
99 |
+
},
|
100 |
+
"audio_length": {
|
101 |
+
"dtype": "float64",
|
102 |
+
"_type": "Value"
|
103 |
+
},
|
104 |
+
"language": {
|
105 |
+
"dtype": "string",
|
106 |
+
"_type": "Value"
|
107 |
+
}
|
108 |
+
},
|
109 |
+
"homepage": "https://commonvoice.mozilla.org/en/datasets",
|
110 |
+
"license": "https://creativecommons.org/publicdomain/zero/1.0/",
|
111 |
+
"size_in_bytes": 12151920472,
|
112 |
+
"splits": {
|
113 |
+
"train": {
|
114 |
+
"name": "train",
|
115 |
+
"num_bytes": 33336098,
|
116 |
+
"num_examples": 45587,
|
117 |
+
"dataset_name": "common_voice_17_0"
|
118 |
+
},
|
119 |
+
"validation": {
|
120 |
+
"name": "validation",
|
121 |
+
"num_bytes": 8797317,
|
122 |
+
"num_examples": 12095,
|
123 |
+
"dataset_name": "common_voice_17_0"
|
124 |
+
},
|
125 |
+
"test": {
|
126 |
+
"name": "test",
|
127 |
+
"num_bytes": 8556167,
|
128 |
+
"num_examples": 12074,
|
129 |
+
"dataset_name": "common_voice_17_0"
|
130 |
+
},
|
131 |
+
"other": {
|
132 |
+
"name": "other",
|
133 |
+
"num_bytes": 67773267,
|
134 |
+
"num_examples": 93989,
|
135 |
+
"dataset_name": "common_voice_17_0"
|
136 |
+
},
|
137 |
+
"invalidated": {
|
138 |
+
"name": "invalidated",
|
139 |
+
"num_bytes": 4282268,
|
140 |
+
"num_examples": 5693,
|
141 |
+
"dataset_name": "common_voice_17_0"
|
142 |
+
},
|
143 |
+
"validated": {
|
144 |
+
"name": "validated",
|
145 |
+
"num_bytes": 98616022,
|
146 |
+
"num_examples": 135391,
|
147 |
+
"dataset_name": "common_voice_17_0"
|
148 |
+
}
|
149 |
+
},
|
150 |
+
"version": {
|
151 |
+
"version_str": "17.0.0",
|
152 |
+
"major": 17,
|
153 |
+
"minor": 0,
|
154 |
+
"patch": 0
|
155 |
+
}
|
156 |
+
}
|
examples/commonvoice_17_ta_asr/state.json
ADDED
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_data_files": [
|
3 |
+
{
|
4 |
+
"filename": "data-00000-of-00001.arrow"
|
5 |
+
}
|
6 |
+
],
|
7 |
+
"_fingerprint": "380f8a99e8b3657c",
|
8 |
+
"_format_columns": null,
|
9 |
+
"_format_kwargs": {},
|
10 |
+
"_format_type": null,
|
11 |
+
"_output_all_columns": false,
|
12 |
+
"_split": null
|
13 |
+
}
|
examples/commonvoice_17_th_asr/data-00000-of-00001.arrow
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bfd84989250d4b79f4cb4b0ae5028d032e221858d6dab77494a04a8a2336aab4
|
3 |
+
size 44792
|
examples/commonvoice_17_th_asr/dataset_info.json
ADDED
@@ -0,0 +1,164 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"builder_name": "common_voice_17_0",
|
3 |
+
"citation": "@inproceedings{commonvoice:2020,\n author = {Ardila, R. and Branson, M. and Davis, K. and Henretty, M. and Kohler, M. and Meyer, J. and Morais, R. and Saunders, L. and Tyers, F. M. and Weber, G.},\n title = {Common Voice: A Massively-Multilingual Speech Corpus},\n booktitle = {Proceedings of the 12th Conference on Language Resources and Evaluation (LREC 2020)},\n pages = {4211--4215},\n year = 2020\n}\n",
|
4 |
+
"config_name": "th",
|
5 |
+
"dataset_name": "common_voice_17_0",
|
6 |
+
"dataset_size": 271837409,
|
7 |
+
"description": "Common Voice is Mozilla's initiative to help teach machines how real people speak. The dataset currently consists of 20408 validated hours of speech in 124 languages, but more voices and languages are always added.",
|
8 |
+
"download_checksums": {
|
9 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/n_shards.json": {
|
10 |
+
"num_bytes": 17491,
|
11 |
+
"checksum": null
|
12 |
+
},
|
13 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/th/train/th_train_0.tar": {
|
14 |
+
"num_bytes": 838082560,
|
15 |
+
"checksum": null
|
16 |
+
},
|
17 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/th/dev/th_dev_0.tar": {
|
18 |
+
"num_bytes": 323399680,
|
19 |
+
"checksum": null
|
20 |
+
},
|
21 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/th/test/th_test_0.tar": {
|
22 |
+
"num_bytes": 335851520,
|
23 |
+
"checksum": null
|
24 |
+
},
|
25 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/th/other/th_other_0.tar": {
|
26 |
+
"num_bytes": 1147064320,
|
27 |
+
"checksum": null
|
28 |
+
},
|
29 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/th/other/th_other_1.tar": {
|
30 |
+
"num_bytes": 1057300480,
|
31 |
+
"checksum": null
|
32 |
+
},
|
33 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/th/other/th_other_2.tar": {
|
34 |
+
"num_bytes": 943237120,
|
35 |
+
"checksum": null
|
36 |
+
},
|
37 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/th/other/th_other_3.tar": {
|
38 |
+
"num_bytes": 837079040,
|
39 |
+
"checksum": null
|
40 |
+
},
|
41 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/th/other/th_other_4.tar": {
|
42 |
+
"num_bytes": 1055385600,
|
43 |
+
"checksum": null
|
44 |
+
},
|
45 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/th/other/th_other_5.tar": {
|
46 |
+
"num_bytes": 176015360,
|
47 |
+
"checksum": null
|
48 |
+
},
|
49 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/th/invalidated/th_invalidated_0.tar": {
|
50 |
+
"num_bytes": 287416320,
|
51 |
+
"checksum": null
|
52 |
+
},
|
53 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/th/validated/th_validated_0.tar": {
|
54 |
+
"num_bytes": 1191843840,
|
55 |
+
"checksum": null
|
56 |
+
},
|
57 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/th/validated/th_validated_1.tar": {
|
58 |
+
"num_bytes": 1079930880,
|
59 |
+
"checksum": null
|
60 |
+
},
|
61 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/th/validated/th_validated_2.tar": {
|
62 |
+
"num_bytes": 1014691840,
|
63 |
+
"checksum": null
|
64 |
+
},
|
65 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/th/validated/th_validated_3.tar": {
|
66 |
+
"num_bytes": 744366080,
|
67 |
+
"checksum": null
|
68 |
+
},
|
69 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/th/train.tsv": {
|
70 |
+
"num_bytes": 11337047,
|
71 |
+
"checksum": null
|
72 |
+
},
|
73 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/th/dev.tsv": {
|
74 |
+
"num_bytes": 3803758,
|
75 |
+
"checksum": null
|
76 |
+
},
|
77 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/th/test.tsv": {
|
78 |
+
"num_bytes": 3702050,
|
79 |
+
"checksum": null
|
80 |
+
},
|
81 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/th/other.tsv": {
|
82 |
+
"num_bytes": 71870764,
|
83 |
+
"checksum": null
|
84 |
+
},
|
85 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/th/invalidated.tsv": {
|
86 |
+
"num_bytes": 3301372,
|
87 |
+
"checksum": null
|
88 |
+
},
|
89 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/th/validated.tsv": {
|
90 |
+
"num_bytes": 50649618,
|
91 |
+
"checksum": null
|
92 |
+
}
|
93 |
+
},
|
94 |
+
"download_size": 11176346740,
|
95 |
+
"features": {
|
96 |
+
"context": {
|
97 |
+
"sampling_rate": 16000,
|
98 |
+
"_type": "Audio"
|
99 |
+
},
|
100 |
+
"instruction": {
|
101 |
+
"dtype": "string",
|
102 |
+
"_type": "Value"
|
103 |
+
},
|
104 |
+
"answer": {
|
105 |
+
"dtype": "string",
|
106 |
+
"_type": "Value"
|
107 |
+
},
|
108 |
+
"audio_length": {
|
109 |
+
"dtype": "float64",
|
110 |
+
"_type": "Value"
|
111 |
+
},
|
112 |
+
"language": {
|
113 |
+
"dtype": "string",
|
114 |
+
"_type": "Value"
|
115 |
+
}
|
116 |
+
},
|
117 |
+
"homepage": "https://commonvoice.mozilla.org/en/datasets",
|
118 |
+
"license": "https://creativecommons.org/publicdomain/zero/1.0/",
|
119 |
+
"size_in_bytes": 11448184149,
|
120 |
+
"splits": {
|
121 |
+
"train": {
|
122 |
+
"name": "train",
|
123 |
+
"num_bytes": 21220759,
|
124 |
+
"num_examples": 32823,
|
125 |
+
"dataset_name": "common_voice_17_0"
|
126 |
+
},
|
127 |
+
"validation": {
|
128 |
+
"name": "validation",
|
129 |
+
"num_bytes": 7084499,
|
130 |
+
"num_examples": 11042,
|
131 |
+
"dataset_name": "common_voice_17_0"
|
132 |
+
},
|
133 |
+
"test": {
|
134 |
+
"name": "test",
|
135 |
+
"num_bytes": 7004874,
|
136 |
+
"num_examples": 11042,
|
137 |
+
"dataset_name": "common_voice_17_0"
|
138 |
+
},
|
139 |
+
"other": {
|
140 |
+
"name": "other",
|
141 |
+
"num_bytes": 134183952,
|
142 |
+
"num_examples": 206935,
|
143 |
+
"dataset_name": "common_voice_17_0"
|
144 |
+
},
|
145 |
+
"invalidated": {
|
146 |
+
"name": "invalidated",
|
147 |
+
"num_bytes": 6202988,
|
148 |
+
"num_examples": 9267,
|
149 |
+
"dataset_name": "common_voice_17_0"
|
150 |
+
},
|
151 |
+
"validated": {
|
152 |
+
"name": "validated",
|
153 |
+
"num_bytes": 96140337,
|
154 |
+
"num_examples": 147160,
|
155 |
+
"dataset_name": "common_voice_17_0"
|
156 |
+
}
|
157 |
+
},
|
158 |
+
"version": {
|
159 |
+
"version_str": "17.0.0",
|
160 |
+
"major": 17,
|
161 |
+
"minor": 0,
|
162 |
+
"patch": 0
|
163 |
+
}
|
164 |
+
}
|
examples/commonvoice_17_th_asr/state.json
ADDED
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_data_files": [
|
3 |
+
{
|
4 |
+
"filename": "data-00000-of-00001.arrow"
|
5 |
+
}
|
6 |
+
],
|
7 |
+
"_fingerprint": "4b0c4a31664c7d67",
|
8 |
+
"_format_columns": null,
|
9 |
+
"_format_kwargs": {},
|
10 |
+
"_format_type": null,
|
11 |
+
"_output_all_columns": false,
|
12 |
+
"_split": null
|
13 |
+
}
|
examples/commonvoice_17_vi_asr/data-00000-of-00001.arrow
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4249665ed76ad59af6281a9c0bacc6862d8cd750218637cd8570bc9d89002751
|
3 |
+
size 39104
|
examples/commonvoice_17_vi_asr/dataset_info.json
ADDED
@@ -0,0 +1,132 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"builder_name": "common_voice_17_0",
|
3 |
+
"citation": "@inproceedings{commonvoice:2020,\n author = {Ardila, R. and Branson, M. and Davis, K. and Henretty, M. and Kohler, M. and Meyer, J. and Morais, R. and Saunders, L. and Tyers, F. M. and Weber, G.},\n title = {Common Voice: A Massively-Multilingual Speech Corpus},\n booktitle = {Proceedings of the 12th Conference on Language Resources and Evaluation (LREC 2020)},\n pages = {4211--4215},\n year = 2020\n}\n",
|
4 |
+
"config_name": "vi",
|
5 |
+
"dataset_name": "common_voice_17_0",
|
6 |
+
"dataset_size": 12705254,
|
7 |
+
"description": "Common Voice is Mozilla's initiative to help teach machines how real people speak. The dataset currently consists of 20408 validated hours of speech in 124 languages, but more voices and languages are always added.",
|
8 |
+
"download_checksums": {
|
9 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/n_shards.json": {
|
10 |
+
"num_bytes": 17491,
|
11 |
+
"checksum": null
|
12 |
+
},
|
13 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/vi/train/vi_train_0.tar": {
|
14 |
+
"num_bytes": 69468160,
|
15 |
+
"checksum": null
|
16 |
+
},
|
17 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/vi/dev/vi_dev_0.tar": {
|
18 |
+
"num_bytes": 14479360,
|
19 |
+
"checksum": null
|
20 |
+
},
|
21 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/vi/test/vi_test_0.tar": {
|
22 |
+
"num_bytes": 34488320,
|
23 |
+
"checksum": null
|
24 |
+
},
|
25 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/vi/other/vi_other_0.tar": {
|
26 |
+
"num_bytes": 276172800,
|
27 |
+
"checksum": null
|
28 |
+
},
|
29 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/vi/invalidated/vi_invalidated_0.tar": {
|
30 |
+
"num_bytes": 11345920,
|
31 |
+
"checksum": null
|
32 |
+
},
|
33 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/audio/vi/validated/vi_validated_0.tar": {
|
34 |
+
"num_bytes": 144384000,
|
35 |
+
"checksum": null
|
36 |
+
},
|
37 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/vi/train.tsv": {
|
38 |
+
"num_bytes": 688189,
|
39 |
+
"checksum": null
|
40 |
+
},
|
41 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/vi/dev.tsv": {
|
42 |
+
"num_bytes": 184767,
|
43 |
+
"checksum": null
|
44 |
+
},
|
45 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/vi/test.tsv": {
|
46 |
+
"num_bytes": 373370,
|
47 |
+
"checksum": null
|
48 |
+
},
|
49 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/vi/other.tsv": {
|
50 |
+
"num_bytes": 3384906,
|
51 |
+
"checksum": null
|
52 |
+
},
|
53 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/vi/invalidated.tsv": {
|
54 |
+
"num_bytes": 111099,
|
55 |
+
"checksum": null
|
56 |
+
},
|
57 |
+
"https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0/resolve/main/transcript/vi/validated.tsv": {
|
58 |
+
"num_bytes": 1521796,
|
59 |
+
"checksum": null
|
60 |
+
}
|
61 |
+
},
|
62 |
+
"download_size": 556620178,
|
63 |
+
"features": {
|
64 |
+
"context": {
|
65 |
+
"sampling_rate": 16000,
|
66 |
+
"_type": "Audio"
|
67 |
+
},
|
68 |
+
"instruction": {
|
69 |
+
"dtype": "string",
|
70 |
+
"_type": "Value"
|
71 |
+
},
|
72 |
+
"answer": {
|
73 |
+
"dtype": "string",
|
74 |
+
"_type": "Value"
|
75 |
+
},
|
76 |
+
"audio_length": {
|
77 |
+
"dtype": "float64",
|
78 |
+
"_type": "Value"
|
79 |
+
},
|
80 |
+
"language": {
|
81 |
+
"dtype": "string",
|
82 |
+
"_type": "Value"
|
83 |
+
}
|
84 |
+
},
|
85 |
+
"homepage": "https://commonvoice.mozilla.org/en/datasets",
|
86 |
+
"license": "https://creativecommons.org/publicdomain/zero/1.0/",
|
87 |
+
"size_in_bytes": 569325432,
|
88 |
+
"splits": {
|
89 |
+
"train": {
|
90 |
+
"name": "train",
|
91 |
+
"num_bytes": 1380061,
|
92 |
+
"num_examples": 2298,
|
93 |
+
"dataset_name": "common_voice_17_0"
|
94 |
+
},
|
95 |
+
"validation": {
|
96 |
+
"name": "validation",
|
97 |
+
"num_bytes": 375111,
|
98 |
+
"num_examples": 641,
|
99 |
+
"dataset_name": "common_voice_17_0"
|
100 |
+
},
|
101 |
+
"test": {
|
102 |
+
"name": "test",
|
103 |
+
"num_bytes": 754342,
|
104 |
+
"num_examples": 1274,
|
105 |
+
"dataset_name": "common_voice_17_0"
|
106 |
+
},
|
107 |
+
"other": {
|
108 |
+
"name": "other",
|
109 |
+
"num_bytes": 6857667,
|
110 |
+
"num_examples": 11533,
|
111 |
+
"dataset_name": "common_voice_17_0"
|
112 |
+
},
|
113 |
+
"invalidated": {
|
114 |
+
"name": "invalidated",
|
115 |
+
"num_bytes": 229034,
|
116 |
+
"num_examples": 377,
|
117 |
+
"dataset_name": "common_voice_17_0"
|
118 |
+
},
|
119 |
+
"validated": {
|
120 |
+
"name": "validated",
|
121 |
+
"num_bytes": 3109039,
|
122 |
+
"num_examples": 5135,
|
123 |
+
"dataset_name": "common_voice_17_0"
|
124 |
+
}
|
125 |
+
},
|
126 |
+
"version": {
|
127 |
+
"version_str": "17.0.0",
|
128 |
+
"major": 17,
|
129 |
+
"minor": 0,
|
130 |
+
"patch": 0
|
131 |
+
}
|
132 |
+
}
|
examples/commonvoice_17_vi_asr/state.json
ADDED
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_data_files": [
|
3 |
+
{
|
4 |
+
"filename": "data-00000-of-00001.arrow"
|
5 |
+
}
|
6 |
+
],
|
7 |
+
"_fingerprint": "6ce07a66a0e6d7b0",
|
8 |
+
"_format_columns": null,
|
9 |
+
"_format_kwargs": {},
|
10 |
+
"_format_type": null,
|
11 |
+
"_output_all_columns": false,
|
12 |
+
"_split": null
|
13 |
+
}
|
examples/commonvoice_zh_asr/data-00000-of-00001.arrow
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:951bb47527709c895c17e6dac4a4a43b2a141b16babd39e56d9199deaec72eb5
|
3 |
+
size 68224
|
examples/commonvoice_zh_asr/dataset_info.json
ADDED
@@ -0,0 +1,182 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"builder_name": "common_voice_16_0",
|
3 |
+
"citation": "@inproceedings{commonvoice:2020,\n author = {Ardila, R. and Branson, M. and Davis, K. and Henretty, M. and Kohler, M. and Meyer, J. and Morais, R. and Saunders, L. and Tyers, F. M. and Weber, G.},\n title = {Common Voice: A Massively-Multilingual Speech Corpus},\n booktitle = {Proceedings of the 12th Conference on Language Resources and Evaluation (LREC 2020)},\n pages = {4211--4215},\n year = 2020\n}\n",
|
4 |
+
"config_name": "zh-CN",
|
5 |
+
"dataset_name": "common_voice_16_0",
|
6 |
+
"dataset_size": 423983727,
|
7 |
+
"description": "Common Voice is Mozilla's initiative to help teach machines how real people speak. The dataset currently consists of 19159 validated hours of speech in 119 languages, but more voices and languages are always added.",
|
8 |
+
"download_checksums": {
|
9 |
+
"https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/n_shards.json": {
|
10 |
+
"num_bytes": 17487,
|
11 |
+
"checksum": null
|
12 |
+
},
|
13 |
+
"https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/audio/zh-CN/train/zh-CN_train_0.tar": {
|
14 |
+
"num_bytes": 1157220864,
|
15 |
+
"checksum": null
|
16 |
+
},
|
17 |
+
"https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/audio/zh-CN/dev/zh-CN_dev_0.tar": {
|
18 |
+
"num_bytes": 436442624,
|
19 |
+
"checksum": null
|
20 |
+
},
|
21 |
+
"https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/audio/zh-CN/test/zh-CN_test_0.tar": {
|
22 |
+
"num_bytes": 506296320,
|
23 |
+
"checksum": null
|
24 |
+
},
|
25 |
+
"https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/audio/zh-CN/other/zh-CN_other_0.tar": {
|
26 |
+
"num_bytes": 1252570624,
|
27 |
+
"checksum": null
|
28 |
+
},
|
29 |
+
"https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/audio/zh-CN/other/zh-CN_other_1.tar": {
|
30 |
+
"num_bytes": 1216365056,
|
31 |
+
"checksum": null
|
32 |
+
},
|
33 |
+
"https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/audio/zh-CN/other/zh-CN_other_2.tar": {
|
34 |
+
"num_bytes": 1057693696,
|
35 |
+
"checksum": null
|
36 |
+
},
|
37 |
+
"https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/audio/zh-CN/other/zh-CN_other_3.tar": {
|
38 |
+
"num_bytes": 1037878784,
|
39 |
+
"checksum": null
|
40 |
+
},
|
41 |
+
"https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/audio/zh-CN/other/zh-CN_other_4.tar": {
|
42 |
+
"num_bytes": 1006488064,
|
43 |
+
"checksum": null
|
44 |
+
},
|
45 |
+
"https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/audio/zh-CN/other/zh-CN_other_5.tar": {
|
46 |
+
"num_bytes": 951297024,
|
47 |
+
"checksum": null
|
48 |
+
},
|
49 |
+
"https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/audio/zh-CN/other/zh-CN_other_6.tar": {
|
50 |
+
"num_bytes": 1054305280,
|
51 |
+
"checksum": null
|
52 |
+
},
|
53 |
+
"https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/audio/zh-CN/other/zh-CN_other_7.tar": {
|
54 |
+
"num_bytes": 1079122944,
|
55 |
+
"checksum": null
|
56 |
+
},
|
57 |
+
"https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/audio/zh-CN/other/zh-CN_other_8.tar": {
|
58 |
+
"num_bytes": 1057605632,
|
59 |
+
"checksum": null
|
60 |
+
},
|
61 |
+
"https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/audio/zh-CN/other/zh-CN_other_9.tar": {
|
62 |
+
"num_bytes": 1054744064,
|
63 |
+
"checksum": null
|
64 |
+
},
|
65 |
+
"https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/audio/zh-CN/other/zh-CN_other_10.tar": {
|
66 |
+
"num_bytes": 1037184512,
|
67 |
+
"checksum": null
|
68 |
+
},
|
69 |
+
"https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/audio/zh-CN/other/zh-CN_other_11.tar": {
|
70 |
+
"num_bytes": 1081821184,
|
71 |
+
"checksum": null
|
72 |
+
},
|
73 |
+
"https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/audio/zh-CN/other/zh-CN_other_12.tar": {
|
74 |
+
"num_bytes": 1144596992,
|
75 |
+
"checksum": null
|
76 |
+
},
|
77 |
+
"https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/audio/zh-CN/other/zh-CN_other_13.tar": {
|
78 |
+
"num_bytes": 1211527680,
|
79 |
+
"checksum": null
|
80 |
+
},
|
81 |
+
"https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/audio/zh-CN/other/zh-CN_other_14.tar": {
|
82 |
+
"num_bytes": 1190928384,
|
83 |
+
"checksum": null
|
84 |
+
},
|
85 |
+
"https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/audio/zh-CN/other/zh-CN_other_15.tar": {
|
86 |
+
"num_bytes": 299709952,
|
87 |
+
"checksum": null
|
88 |
+
},
|
89 |
+
"https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/audio/zh-CN/invalidated/zh-CN_invalidated_0.tar": {
|
90 |
+
"num_bytes": 1000983552,
|
91 |
+
"checksum": null
|
92 |
+
},
|
93 |
+
"https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/audio/zh-CN/invalidated/zh-CN_invalidated_1.tar": {
|
94 |
+
"num_bytes": 416471552,
|
95 |
+
"checksum": null
|
96 |
+
},
|
97 |
+
"https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/transcript/zh-CN/train.tsv": {
|
98 |
+
"num_bytes": 7373507,
|
99 |
+
"checksum": null
|
100 |
+
},
|
101 |
+
"https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/transcript/zh-CN/dev.tsv": {
|
102 |
+
"num_bytes": 2567399,
|
103 |
+
"checksum": null
|
104 |
+
},
|
105 |
+
"https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/transcript/zh-CN/test.tsv": {
|
106 |
+
"num_bytes": 2457920,
|
107 |
+
"checksum": null
|
108 |
+
},
|
109 |
+
"https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/transcript/zh-CN/other.tsv": {
|
110 |
+
"num_bytes": 137605043,
|
111 |
+
"checksum": null
|
112 |
+
},
|
113 |
+
"https://huggingface.co/datasets/fsicoli/common_voice_16_0/resolve/main/transcript/zh-CN/invalidated.tsv": {
|
114 |
+
"num_bytes": 13622503,
|
115 |
+
"checksum": null
|
116 |
+
}
|
117 |
+
},
|
118 |
+
"download_size": 20414898643,
|
119 |
+
"features": {
|
120 |
+
"context": {
|
121 |
+
"sampling_rate": 16000,
|
122 |
+
"_type": "Audio"
|
123 |
+
},
|
124 |
+
"instruction": {
|
125 |
+
"dtype": "string",
|
126 |
+
"_type": "Value"
|
127 |
+
},
|
128 |
+
"answer": {
|
129 |
+
"dtype": "string",
|
130 |
+
"_type": "Value"
|
131 |
+
},
|
132 |
+
"audio_length": {
|
133 |
+
"dtype": "float64",
|
134 |
+
"_type": "Value"
|
135 |
+
},
|
136 |
+
"language": {
|
137 |
+
"dtype": "string",
|
138 |
+
"_type": "Value"
|
139 |
+
}
|
140 |
+
},
|
141 |
+
"homepage": "https://commonvoice.mozilla.org/en/datasets",
|
142 |
+
"license": "https://creativecommons.org/publicdomain/zero/1.0/",
|
143 |
+
"size_in_bytes": 20838882370,
|
144 |
+
"splits": {
|
145 |
+
"train": {
|
146 |
+
"name": "train",
|
147 |
+
"num_bytes": 17963235,
|
148 |
+
"num_examples": 29406,
|
149 |
+
"dataset_name": "common_voice_16_0"
|
150 |
+
},
|
151 |
+
"validation": {
|
152 |
+
"name": "validation",
|
153 |
+
"num_bytes": 6351483,
|
154 |
+
"num_examples": 10626,
|
155 |
+
"dataset_name": "common_voice_16_0"
|
156 |
+
},
|
157 |
+
"test": {
|
158 |
+
"name": "test",
|
159 |
+
"num_bytes": 6263265,
|
160 |
+
"num_examples": 10626,
|
161 |
+
"dataset_name": "common_voice_16_0"
|
162 |
+
},
|
163 |
+
"other": {
|
164 |
+
"name": "other",
|
165 |
+
"num_bytes": 358056452,
|
166 |
+
"num_examples": 610981,
|
167 |
+
"dataset_name": "common_voice_16_0"
|
168 |
+
},
|
169 |
+
"invalidated": {
|
170 |
+
"name": "invalidated",
|
171 |
+
"num_bytes": 35349292,
|
172 |
+
"num_examples": 58386,
|
173 |
+
"dataset_name": "common_voice_16_0"
|
174 |
+
}
|
175 |
+
},
|
176 |
+
"version": {
|
177 |
+
"version_str": "15.0.0",
|
178 |
+
"major": 15,
|
179 |
+
"minor": 0,
|
180 |
+
"patch": 0
|
181 |
+
}
|
182 |
+
}
|
examples/commonvoice_zh_asr/state.json
ADDED
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_data_files": [
|
3 |
+
{
|
4 |
+
"filename": "data-00000-of-00001.arrow"
|
5 |
+
}
|
6 |
+
],
|
7 |
+
"_fingerprint": "41452271d4051e81",
|
8 |
+
"_format_columns": null,
|
9 |
+
"_format_kwargs": {},
|
10 |
+
"_format_type": null,
|
11 |
+
"_output_all_columns": false,
|
12 |
+
"_split": null
|
13 |
+
}
|
examples/covost2_en_id_test/data-00000-of-00001.arrow
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7d4bfb1098a59bf75aab6b9b824141808bb48160787b182b03fabf4a56527a9e
|
3 |
+
size 56496
|
examples/covost2_en_id_test/dataset_info.json
ADDED
@@ -0,0 +1,73 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"builder_name": "parquet",
|
3 |
+
"citation": "",
|
4 |
+
"config_name": "default",
|
5 |
+
"dataset_name": "covost2_en_id_test_v1",
|
6 |
+
"dataset_size": 2842304040,
|
7 |
+
"description": "",
|
8 |
+
"download_checksums": {
|
9 |
+
"hf://datasets/AudioLLMs/covost2_en_id_test_v1@51a4b1517f07e1dcf9180aa270f264961165cab3/data/test-00000-of-00006.parquet": {
|
10 |
+
"num_bytes": 421383822,
|
11 |
+
"checksum": null
|
12 |
+
},
|
13 |
+
"hf://datasets/AudioLLMs/covost2_en_id_test_v1@51a4b1517f07e1dcf9180aa270f264961165cab3/data/test-00001-of-00006.parquet": {
|
14 |
+
"num_bytes": 430366828,
|
15 |
+
"checksum": null
|
16 |
+
},
|
17 |
+
"hf://datasets/AudioLLMs/covost2_en_id_test_v1@51a4b1517f07e1dcf9180aa270f264961165cab3/data/test-00002-of-00006.parquet": {
|
18 |
+
"num_bytes": 423203231,
|
19 |
+
"checksum": null
|
20 |
+
},
|
21 |
+
"hf://datasets/AudioLLMs/covost2_en_id_test_v1@51a4b1517f07e1dcf9180aa270f264961165cab3/data/test-00003-of-00006.parquet": {
|
22 |
+
"num_bytes": 420946330,
|
23 |
+
"checksum": null
|
24 |
+
},
|
25 |
+
"hf://datasets/AudioLLMs/covost2_en_id_test_v1@51a4b1517f07e1dcf9180aa270f264961165cab3/data/test-00004-of-00006.parquet": {
|
26 |
+
"num_bytes": 419734090,
|
27 |
+
"checksum": null
|
28 |
+
},
|
29 |
+
"hf://datasets/AudioLLMs/covost2_en_id_test_v1@51a4b1517f07e1dcf9180aa270f264961165cab3/data/test-00005-of-00006.parquet": {
|
30 |
+
"num_bytes": 419963769,
|
31 |
+
"checksum": null
|
32 |
+
}
|
33 |
+
},
|
34 |
+
"download_size": 2535598070,
|
35 |
+
"features": {
|
36 |
+
"context": {
|
37 |
+
"_type": "Audio"
|
38 |
+
},
|
39 |
+
"instruction": {
|
40 |
+
"dtype": "string",
|
41 |
+
"_type": "Value"
|
42 |
+
},
|
43 |
+
"answer": {
|
44 |
+
"dtype": "string",
|
45 |
+
"_type": "Value"
|
46 |
+
}
|
47 |
+
},
|
48 |
+
"homepage": "",
|
49 |
+
"license": "",
|
50 |
+
"size_in_bytes": 5377902110,
|
51 |
+
"splits": {
|
52 |
+
"test": {
|
53 |
+
"name": "test",
|
54 |
+
"num_bytes": 2842304040,
|
55 |
+
"num_examples": 15531,
|
56 |
+
"shard_lengths": [
|
57 |
+
2789,
|
58 |
+
2789,
|
59 |
+
2789,
|
60 |
+
2788,
|
61 |
+
2788,
|
62 |
+
1588
|
63 |
+
],
|
64 |
+
"dataset_name": "covost2_en_id_test_v1"
|
65 |
+
}
|
66 |
+
},
|
67 |
+
"version": {
|
68 |
+
"version_str": "0.0.0",
|
69 |
+
"major": 0,
|
70 |
+
"minor": 0,
|
71 |
+
"patch": 0
|
72 |
+
}
|
73 |
+
}
|
examples/covost2_en_id_test/state.json
ADDED
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_data_files": [
|
3 |
+
{
|
4 |
+
"filename": "data-00000-of-00001.arrow"
|
5 |
+
}
|
6 |
+
],
|
7 |
+
"_fingerprint": "f755c8fc2cb9504a",
|
8 |
+
"_format_columns": null,
|
9 |
+
"_format_kwargs": {},
|
10 |
+
"_format_type": null,
|
11 |
+
"_output_all_columns": false,
|
12 |
+
"_split": null
|
13 |
+
}
|
examples/covost2_en_ta_test/data-00000-of-00001.arrow
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:89aa8cee7fa6754a1491ca48e31162126a808e07bca8731ecf2949bc183dd20f
|
3 |
+
size 58088
|
examples/covost2_en_ta_test/dataset_info.json
ADDED
@@ -0,0 +1,73 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"builder_name": "parquet",
|
3 |
+
"citation": "",
|
4 |
+
"config_name": "default",
|
5 |
+
"dataset_name": "covost2_en_ta_test_v1",
|
6 |
+
"dataset_size": 2844002846,
|
7 |
+
"description": "",
|
8 |
+
"download_checksums": {
|
9 |
+
"hf://datasets/AudioLLMs/covost2_en_ta_test_v1@23c23a71d698faf6c940e18753ade03acbcef86b/data/test-00000-of-00006.parquet": {
|
10 |
+
"num_bytes": 421472102,
|
11 |
+
"checksum": null
|
12 |
+
},
|
13 |
+
"hf://datasets/AudioLLMs/covost2_en_ta_test_v1@23c23a71d698faf6c940e18753ade03acbcef86b/data/test-00001-of-00006.parquet": {
|
14 |
+
"num_bytes": 430453377,
|
15 |
+
"checksum": null
|
16 |
+
},
|
17 |
+
"hf://datasets/AudioLLMs/covost2_en_ta_test_v1@23c23a71d698faf6c940e18753ade03acbcef86b/data/test-00002-of-00006.parquet": {
|
18 |
+
"num_bytes": 423289725,
|
19 |
+
"checksum": null
|
20 |
+
},
|
21 |
+
"hf://datasets/AudioLLMs/covost2_en_ta_test_v1@23c23a71d698faf6c940e18753ade03acbcef86b/data/test-00003-of-00006.parquet": {
|
22 |
+
"num_bytes": 421032929,
|
23 |
+
"checksum": null
|
24 |
+
},
|
25 |
+
"hf://datasets/AudioLLMs/covost2_en_ta_test_v1@23c23a71d698faf6c940e18753ade03acbcef86b/data/test-00004-of-00006.parquet": {
|
26 |
+
"num_bytes": 419820665,
|
27 |
+
"checksum": null
|
28 |
+
},
|
29 |
+
"hf://datasets/AudioLLMs/covost2_en_ta_test_v1@23c23a71d698faf6c940e18753ade03acbcef86b/data/test-00005-of-00006.parquet": {
|
30 |
+
"num_bytes": 420052504,
|
31 |
+
"checksum": null
|
32 |
+
}
|
33 |
+
},
|
34 |
+
"download_size": 2536121302,
|
35 |
+
"features": {
|
36 |
+
"context": {
|
37 |
+
"_type": "Audio"
|
38 |
+
},
|
39 |
+
"instruction": {
|
40 |
+
"dtype": "string",
|
41 |
+
"_type": "Value"
|
42 |
+
},
|
43 |
+
"answer": {
|
44 |
+
"dtype": "string",
|
45 |
+
"_type": "Value"
|
46 |
+
}
|
47 |
+
},
|
48 |
+
"homepage": "",
|
49 |
+
"license": "",
|
50 |
+
"size_in_bytes": 5380124148,
|
51 |
+
"splits": {
|
52 |
+
"test": {
|
53 |
+
"name": "test",
|
54 |
+
"num_bytes": 2844002846,
|
55 |
+
"num_examples": 15531,
|
56 |
+
"shard_lengths": [
|
57 |
+
2789,
|
58 |
+
2789,
|
59 |
+
2789,
|
60 |
+
2788,
|
61 |
+
2788,
|
62 |
+
1588
|
63 |
+
],
|
64 |
+
"dataset_name": "covost2_en_ta_test_v1"
|
65 |
+
}
|
66 |
+
},
|
67 |
+
"version": {
|
68 |
+
"version_str": "0.0.0",
|
69 |
+
"major": 0,
|
70 |
+
"minor": 0,
|
71 |
+
"patch": 0
|
72 |
+
}
|
73 |
+
}
|
examples/covost2_en_ta_test/state.json
ADDED
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_data_files": [
|
3 |
+
{
|
4 |
+
"filename": "data-00000-of-00001.arrow"
|
5 |
+
}
|
6 |
+
],
|
7 |
+
"_fingerprint": "fe170901fd58bb52",
|
8 |
+
"_format_columns": null,
|
9 |
+
"_format_kwargs": {},
|
10 |
+
"_format_type": null,
|
11 |
+
"_output_all_columns": false,
|
12 |
+
"_split": null
|
13 |
+
}
|
examples/covost2_en_zh_test/data-00000-of-00001.arrow
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aca2fa905173efcf428fd779b4e74ff132b8bab979f925e75ad7ff8b9b19aaa8
|
3 |
+
size 40016
|
examples/covost2_en_zh_test/dataset_info.json
ADDED
@@ -0,0 +1,73 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"builder_name": "parquet",
|
3 |
+
"citation": "",
|
4 |
+
"config_name": "default",
|
5 |
+
"dataset_name": "covost2_en_zh_test_v1",
|
6 |
+
"dataset_size": 2842110316,
|
7 |
+
"description": "",
|
8 |
+
"download_checksums": {
|
9 |
+
"hf://datasets/AudioLLMs/covost2_en_zh_test_v1@6fe92d7fabaee215b078b022abbe8959280f3187/data/test-00000-of-00006.parquet": {
|
10 |
+
"num_bytes": 421376507,
|
11 |
+
"checksum": null
|
12 |
+
},
|
13 |
+
"hf://datasets/AudioLLMs/covost2_en_zh_test_v1@6fe92d7fabaee215b078b022abbe8959280f3187/data/test-00001-of-00006.parquet": {
|
14 |
+
"num_bytes": 430362096,
|
15 |
+
"checksum": null
|
16 |
+
},
|
17 |
+
"hf://datasets/AudioLLMs/covost2_en_zh_test_v1@6fe92d7fabaee215b078b022abbe8959280f3187/data/test-00002-of-00006.parquet": {
|
18 |
+
"num_bytes": 423196814,
|
19 |
+
"checksum": null
|
20 |
+
},
|
21 |
+
"hf://datasets/AudioLLMs/covost2_en_zh_test_v1@6fe92d7fabaee215b078b022abbe8959280f3187/data/test-00003-of-00006.parquet": {
|
22 |
+
"num_bytes": 420938958,
|
23 |
+
"checksum": null
|
24 |
+
},
|
25 |
+
"hf://datasets/AudioLLMs/covost2_en_zh_test_v1@6fe92d7fabaee215b078b022abbe8959280f3187/data/test-00004-of-00006.parquet": {
|
26 |
+
"num_bytes": 419730286,
|
27 |
+
"checksum": null
|
28 |
+
},
|
29 |
+
"hf://datasets/AudioLLMs/covost2_en_zh_test_v1@6fe92d7fabaee215b078b022abbe8959280f3187/data/test-00005-of-00006.parquet": {
|
30 |
+
"num_bytes": 419958145,
|
31 |
+
"checksum": null
|
32 |
+
}
|
33 |
+
},
|
34 |
+
"download_size": 2535562806,
|
35 |
+
"features": {
|
36 |
+
"context": {
|
37 |
+
"_type": "Audio"
|
38 |
+
},
|
39 |
+
"instruction": {
|
40 |
+
"dtype": "string",
|
41 |
+
"_type": "Value"
|
42 |
+
},
|
43 |
+
"answer": {
|
44 |
+
"dtype": "string",
|
45 |
+
"_type": "Value"
|
46 |
+
}
|
47 |
+
},
|
48 |
+
"homepage": "",
|
49 |
+
"license": "",
|
50 |
+
"size_in_bytes": 5377673122,
|
51 |
+
"splits": {
|
52 |
+
"test": {
|
53 |
+
"name": "test",
|
54 |
+
"num_bytes": 2842110316,
|
55 |
+
"num_examples": 15531,
|
56 |
+
"shard_lengths": [
|
57 |
+
2789,
|
58 |
+
2789,
|
59 |
+
2789,
|
60 |
+
2788,
|
61 |
+
2788,
|
62 |
+
1588
|
63 |
+
],
|
64 |
+
"dataset_name": "covost2_en_zh_test_v1"
|
65 |
+
}
|
66 |
+
},
|
67 |
+
"version": {
|
68 |
+
"version_str": "0.0.0",
|
69 |
+
"major": 0,
|
70 |
+
"minor": 0,
|
71 |
+
"patch": 0
|
72 |
+
}
|
73 |
+
}
|
examples/covost2_en_zh_test/state.json
ADDED
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_data_files": [
|
3 |
+
{
|
4 |
+
"filename": "data-00000-of-00001.arrow"
|
5 |
+
}
|
6 |
+
],
|
7 |
+
"_fingerprint": "7445fef56d00d00b",
|
8 |
+
"_format_columns": null,
|
9 |
+
"_format_kwargs": {},
|
10 |
+
"_format_type": null,
|
11 |
+
"_output_all_columns": false,
|
12 |
+
"_split": null
|
13 |
+
}
|
examples/covost2_id_en_test/data-00000-of-00001.arrow
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:573589410f93a7667f83d37bd30b472069e7446d2d5e05aa98fc4138b0fd316b
|
3 |
+
size 50736
|
examples/covost2_id_en_test/dataset_info.json
ADDED
@@ -0,0 +1,45 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"builder_name": "parquet",
|
3 |
+
"citation": "",
|
4 |
+
"config_name": "default",
|
5 |
+
"dataset_name": "covost2_id_en_test_v1",
|
6 |
+
"dataset_size": 105217105,
|
7 |
+
"description": "",
|
8 |
+
"download_checksums": {
|
9 |
+
"hf://datasets/AudioLLMs/covost2_id_en_test_v1@3998e50bec6eefdae5b38278238c359acb583f4c/data/test-00000-of-00001.parquet": {
|
10 |
+
"num_bytes": 100225392,
|
11 |
+
"checksum": null
|
12 |
+
}
|
13 |
+
},
|
14 |
+
"download_size": 100225392,
|
15 |
+
"features": {
|
16 |
+
"context": {
|
17 |
+
"_type": "Audio"
|
18 |
+
},
|
19 |
+
"instruction": {
|
20 |
+
"dtype": "string",
|
21 |
+
"_type": "Value"
|
22 |
+
},
|
23 |
+
"answer": {
|
24 |
+
"dtype": "string",
|
25 |
+
"_type": "Value"
|
26 |
+
}
|
27 |
+
},
|
28 |
+
"homepage": "",
|
29 |
+
"license": "",
|
30 |
+
"size_in_bytes": 205442497,
|
31 |
+
"splits": {
|
32 |
+
"test": {
|
33 |
+
"name": "test",
|
34 |
+
"num_bytes": 105217105,
|
35 |
+
"num_examples": 844,
|
36 |
+
"dataset_name": "covost2_id_en_test_v1"
|
37 |
+
}
|
38 |
+
},
|
39 |
+
"version": {
|
40 |
+
"version_str": "0.0.0",
|
41 |
+
"major": 0,
|
42 |
+
"minor": 0,
|
43 |
+
"patch": 0
|
44 |
+
}
|
45 |
+
}
|