Skip to content

Commit

Permalink
updates from main
Browse files (browse the repository at this point in the history)
  • Loading branch information
Atticus1806 committed Sep 13, 2023
1 parent 952cb54 commit b870355
Showing 1 changed file with 4 additions and 11 deletions.
15 changes: 4 additions & 11 deletions common/datasets/tedlium2/corpus.py
Original file line number Diff line number Diff line change
Expand Up @@ -28,17 +28,9 @@ def get_bliss_corpus_dict(audio_format: str = "wav", output_prefix: str = "datas
bliss_corpus_dict = download_data_dict(output_prefix=output_prefix).bliss_nist

  audio_format_options = {
- "wav": {
- "output_format": "wav",
- "codec": "pcm_s16le",
- "recover_duration": False,
- },
- "ogg": {"output_format": "ogg", "codec": "libvorbis", "recover_duration": False},
- "flac": {
- "output_format": "flac",
- "codec": "flac",
- "recover_duration": False,
- },
+ "wav": {"output_format": "wav", "codec": "pcm_s16le"},
+ "ogg": {"output_format": "ogg", "codec": "libvorbis"},
+ "flac": {"output_format": "flac", "codec": "flac"},
  }

converted_bliss_corpus_dict = {}
Expand All @@ -47,6 +39,7 @@ def get_bliss_corpus_dict(audio_format: str = "wav", output_prefix: str = "datas
bliss_change_encoding_job = BlissChangeEncodingJob(
corpus_file=sph_corpus,
sample_rate=16000,
+ recover_duration=False,
**audio_format_options[audio_format],
)
bliss_change_encoding_job.add_alias(
Expand Down

0 comments on commit b870355

Please sign in to comment.