Skip to content

Commit 9db84a1

Browse files
authored
Merge pull request #5 from hyhuc0079/hyhuc0079-patch-2
Hyhuc0079 patch 2
2 parents 3849c96 + 13d0844 commit 9db84a1

2 files changed

Lines changed: 12 additions & 10 deletions

File tree

audio_slicer_pre.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -13,7 +13,7 @@
1313
"--max_sec", "-M", type=int, default=5000, help="Maximum seconds of a slice"
1414
)
1515
parser.add_argument(
16-
"--model_name",
16+
"--dataset_path",
1717
type=str,
1818
default="inputs",
1919
help="Directory of input wav files",
@@ -38,7 +38,7 @@
3838
os.makedirs(folder_path)
3939

4040
# 遍历指定目录下的所有.wav文件
41-
audio_directory = f'{args.model_name}'
41+
audio_directory = f'{args.dataset_path}'
4242
for filename in os.listdir(audio_directory):
4343
file_path = os.path.join(audio_directory, filename)
4444
if os.path.isfile(file_path) and filename.endswith('.wav'):

webui_dataset.py

Lines changed: 10 additions & 8 deletions
Original file line number | Diff line number | Diff line change
@@ -11,21 +11,21 @@
1111

1212

1313
def do_slice(
14-
model_name: str,
14+
dataset_path: str,
1515
min_sec: int,
1616
max_sec: int,
1717
min_silence_dur_ms: int,
1818
):
19-
if model_name == "":
20-
return "Error: 角色名不能为空"
19+
if dataset_path == "":
20+
return "Error: 数据集路径不能为空"
2121
logger.info("Start slicing...")
22-
output_dir = os.path.join(dataset_root, model_name, ".\\wavs")
22+
output_dir = os.path.join(dataset_root, dataset_path, ".\\wavs")
2323

2424

2525
cmd = [
2626
"audio_slicer_pre.py",
27-
"--model_name",
28-
model_name,
27+
"--dataset_path",
28+
dataset_path,
2929
"--min_sec",
3030
str(min_sec),
3131
"--max_sec",
@@ -115,6 +115,8 @@ def do_transcribe_all(
115115
with gr.Blocks(theme="NoCrypt/miku") as app:
116116
gr.Markdown(initial_md)
117117
model_name = gr.Textbox(label="角色名",placeholder="请输入角色名")
118+
##add by hyh 添加一个数据集路径的文本框
119+
dataset_path = gr.Textbox(label="数据集路径",placeholder="设置切割数据集样本路径")
118120

119121
with gr.Accordion("音频素材切割"):
120122
with gr.Row():
@@ -158,7 +160,7 @@ def do_transcribe_all(
158160

159161
slice_button.click(
160162
do_slice,
161-
inputs=[model_name, min_sec, max_sec, min_silence_dur_ms],
163+
inputs=[dataset_path, min_sec, max_sec, min_silence_dur_ms],
162164
outputs=[result1],
163165
)
164166
transcribe_button_whisper.click(
@@ -212,4 +214,4 @@ def do_transcribe_all(
212214
)
213215
args = parser.parse_args()
214216

215-
app.launch(inbrowser=not args.no_autolaunch, server_name=args.server_name)
217+
app.launch(inbrowser=not args.no_autolaunch, server_name=args.server_name, server_port=7971)

0 commit comments

Comments (0)