Update batch_confirm_hf.py to load the entire validated dataset instead of a subset.
This commit is contained in:
@@ -14,7 +14,7 @@ from huggingface_hub import HfApi, create_repo
 print("Loading dataset...")
 ds = load_dataset(
     "Ashegh-Sad-Warrior/Persian_Common_Voice_17_0",
-    split="validated[:5]",
+    split="validated",
     streaming=False
 ).cast_column("audio", Audio(sampling_rate=16000))
 
Reference in New Issue
Block a user