-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathreference_transcripts_metadata.json
More file actions
54 lines (54 loc) · 1.71 KB
/
reference_transcripts_metadata.json
File metadata and controls
54 lines (54 loc) · 1.71 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
{
"benchmark": {
"name": "Voices for Christ Benchmark",
"submission_process": "Submit a pull request that adds a new benchmark_data/<mode> directory with one output file per original filename.",
"task": "speech restoration and denoising",
"version": "0.3.0"
},
"dataset": {
"clip_count": 100,
"clip_duration_seconds": 30,
"distribution_status": "public",
"license_note": "Current working assumption: the source Voices for Christ recordings are pre-1990 and open-domain/public-domain compatible. This should be verified before wider redistribution or downstream commercial reuse.",
"license_status": "assumed_public_domain_unverified",
"name": "Voices for Christ archive excerpts",
"source_format": "mp3",
"splits": [
"public_test"
],
"storage": "git-lfs",
"total_duration_seconds": 3000,
"version": "0.1.0"
},
"reference_transcripts": {
"asr_model": {
"beam_size": 15,
"best_of": 15,
"compute_type": "float16",
"condition_on_previous_text": true,
"device": "cuda",
"device_index": 0,
"download_root": null,
"language": "en",
"model_name": "large-v3",
"patience": 2.0
},
"policy": "Strong-reference decode of benchmark_data/original using a larger ASR model and wider beam than submission scoring."
},
"run": {
"argv": [
"score_asr_wer.py"
],
"file_count": 100,
"package_versions": {
"faster-whisper": "1.2.0",
"numpy": "2.2.6",
"torch": "2.8.0",
"torchaudio": "2.8.0",
"tqdm": "4.67.3"
},
"platform": "Linux-6.5.0-15-generic-x86_64-with-glibc2.35",
"python_version": "3.10.12",
"timestamp_utc": "2026-03-17T22:58:48.810633Z"
}
}