diff --git a/configs/lightning_datamodule/bwe.yaml b/configs/lightning_datamodule/bwe.yaml index cd4d32a..c3306e6 100644 --- a/configs/lightning_datamodule/bwe.yaml +++ b/configs/lightning_datamodule/bwe.yaml @@ -1,7 +1,7 @@ _target_: vibravox.lightning_datamodules.bwe.BWELightningDataModule sample_rate: ${sample_rate} -dataset_name: "Cnam-LMSSC/vibravox2" +dataset_name: "Cnam-LMSSC/vibravox" subset: "speech_clean" sensor: "body_conducted.rigid_in_ear_microphone" collate_strategy: "constant_length-2500-ms" diff --git a/configs/lightning_datamodule/spkv.yaml b/configs/lightning_datamodule/spkv.yaml index d09b485..e4ba056 100644 --- a/configs/lightning_datamodule/spkv.yaml +++ b/configs/lightning_datamodule/spkv.yaml @@ -1,7 +1,7 @@ _target_: vibravox.lightning_datamodules.spkv.SPKVLightningDataModule sample_rate: ${sample_rate} -dataset_name: "Cnam-LMSSC/vibravox2" +dataset_name: "Cnam-LMSSC/vibravox" subset: "speech_clean" pairs: "mixed_gender" # can also be "same_gender" sensor_a: "headset_microphone" diff --git a/configs/lightning_datamodule/stp.yaml b/configs/lightning_datamodule/stp.yaml index 70264c0..6632aaa 100644 --- a/configs/lightning_datamodule/stp.yaml +++ b/configs/lightning_datamodule/stp.yaml @@ -1,7 +1,7 @@ _target_: vibravox.lightning_datamodules.stp.STPLightningDataModule sample_rate: ${sample_rate} -dataset_name: "Cnam-LMSSC/vibravox2" +dataset_name: "Cnam-LMSSC/vibravox" subset: "speech_clean" sensor: "headset_microphone" streaming: False diff --git a/scripts/eben_enhanced_vibravox.py b/scripts/eben_enhanced_vibravox.py index 7dd6199..df66bf0 100644 --- a/scripts/eben_enhanced_vibravox.py +++ b/scripts/eben_enhanced_vibravox.py @@ -12,7 +12,7 @@ resampler = torchaudio.transforms.Resample(orig_freq=48_000, new_freq=16_000) -test_dataset = load_dataset("Cnam-LMSSC/vibravox2", "speech_clean", split="test", streaming=False) +test_dataset = load_dataset("Cnam-LMSSC/vibravox", "speech_clean", split="test", streaming=False) def enhance_audio(sample): diff --git a/scripts/test_all_phonemizers.py b/scripts/test_all_phonemizers.py index 18dd5d6..39e79e4 100644 --- a/scripts/test_all_phonemizers.py +++ b/scripts/test_all_phonemizers.py @@ -23,7 +23,7 @@ SAMPLE_RATE = 16_000 -DATASETS = ["Cnam-LMSSC/vibravox2", "Cnam-LMSSC/vibravox_enhanced_by_EBEN"] +DATASETS = ["Cnam-LMSSC/vibravox", "Cnam-LMSSC/vibravox_enhanced_by_EBEN"] FEATURE_EXTRACTOR = transformers.Wav2Vec2FeatureExtractor() TOKENIZER = transformers.Wav2Vec2CTCTokenizer.from_pretrained("Cnam-LMSSC/vibravox-phonemes-tokenizer") PER = torchmetrics.text.CharErrorRate()