-
Notifications
You must be signed in to change notification settings - Fork 0
/
preprocess.py
36 lines (31 loc) · 924 Bytes
/
preprocess.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
"""
Created on 2022/06/13
@author Sangwoo Han
"""
from typing import Any
import click
from main import cli
from src.dataset.kspon.preprocess import preprocess_data
from src.dataset.kspon.preprocess.character import (
generate_character_script,
)
from src.utils import AttrDict, log_elapsed_time
# Registers this function as a command on `cli` (imported from `main`;
# presumably the project's top-level click group). `show_default` makes
# `--help` print each option's default value.
@cli.command(context_settings={"show_default": True})
@click.option(
    "--data-dir",
    type=click.Path(exists=True),  # click rejects a path that does not exist
    default="./data/kspon_speech/original",
    help="Data path of original KSponSpeech dataset",
)
@click.option(
    "--save-path",
    type=click.Path(),  # no existence check: this is an output location
    default="./data/kspon_speech/preprocessed",
    help="Path to be saved preprocessed data",
)
@log_elapsed_time
def preprocess_kspon(**args: Any) -> None:
    """Preprocess KsponSpeech"""
    # NOTE: the docstring above is what click displays as this command's help
    # text, so it is intentionally kept short and unchanged.
    #
    # click passes the parsed options as keyword arguments (`data_dir`,
    # `save_path`); wrapping them in AttrDict allows attribute-style access.
    args = AttrDict(args)

    # Step 1: read the original dataset under --data-dir. The call yields a
    # pair that is unpacked into audio paths and their transcripts.
    audio_paths, transcripts = preprocess_data(args.data_dir)

    # Step 2: hand both sequences to the character-level script generator,
    # which is given --save-path as its output location.
    generate_character_script(audio_paths, transcripts, args.save_path)