Spaces:
Running
on
Zero
Running
on
Zero
Commit
·
f045a70
1
Parent(s):
8c97255
README.md
CHANGED
|
@@ -1,5 +1,5 @@
|
|
| 1 |
---
|
| 2 |
-
title: Dhivehi
|
| 3 |
emoji: 📊
|
| 4 |
colorFrom: green
|
| 5 |
colorTo: purple
|
|
|
|
| 1 |
---
|
| 2 |
+
title: Dhivehi TTS Demos
|
| 3 |
emoji: 📊
|
| 4 |
colorFrom: green
|
| 5 |
colorTo: purple
|
app.py
CHANGED
|
@@ -510,19 +510,19 @@ with gr.Blocks(
|
|
| 510 |
|
| 511 |
# Context Generation
|
| 512 |
with gr.TabItem("🎭 Context Generation"):
|
| 513 |
-
gr.Markdown("### Generate speech with
|
| 514 |
|
| 515 |
with gr.Row():
|
| 516 |
with gr.Column():
|
| 517 |
context_text = gr.Textbox(
|
| 518 |
-
label="
|
| 519 |
placeholder="މަންމަ ކިހާއިރެއް ދަރިފުޅުގެ އިންތިޒާރުގަ އިންނަތާ",
|
| 520 |
value="އައިލީޝް އޭނާއަތަށް ލިބުނީ އެންމެ ނުވަ މަހުގަ",
|
| 521 |
lines=2,
|
| 522 |
elem_classes=["dhivehi-text"]
|
| 523 |
)
|
| 524 |
context_audio = gr.Audio(
|
| 525 |
-
label="
|
| 526 |
type="filepath"
|
| 527 |
)
|
| 528 |
target_text = gr.Textbox(
|
|
@@ -574,26 +574,26 @@ with gr.Blocks(
|
|
| 574 |
with gr.Accordion("🎵 Audio Style References", open=False):
|
| 575 |
with gr.Row():
|
| 576 |
with gr.Column():
|
| 577 |
-
gr.Markdown("**Speaker A
|
| 578 |
speaker_a_audio = gr.Audio(
|
| 579 |
type="filepath",
|
| 580 |
label="Speaker A Audio Style"
|
| 581 |
)
|
| 582 |
speaker_a_text = gr.Textbox(
|
| 583 |
-
label="Speaker A
|
| 584 |
lines=2,
|
| 585 |
placeholder="މަންމަ ކިހާއިރެއް ދަރިފުޅުގެ އިންތިޒާރުގަ އިންނަތާ",
|
| 586 |
elem_classes=["dhivehi-text"]
|
| 587 |
)
|
| 588 |
|
| 589 |
with gr.Column():
|
| 590 |
-
gr.Markdown("**Speaker B
|
| 591 |
speaker_b_audio = gr.Audio(
|
| 592 |
type="filepath",
|
| 593 |
-
label="Speaker B
|
| 594 |
)
|
| 595 |
speaker_b_text = gr.Textbox(
|
| 596 |
-
label="Speaker B
|
| 597 |
lines=2,
|
| 598 |
placeholder="މަންމަ ކިހާއިރެއް ދަރިފުޅުގެ އިންތިޒާރުގަ އިންނަތާ",
|
| 599 |
elem_classes=["dhivehi-text"]
|
|
|
|
| 510 |
|
| 511 |
# Context Generation
|
| 512 |
with gr.TabItem("🎭 Context Generation"):
|
| 513 |
+
gr.Markdown("### Generate speech with voice prompt")
|
| 514 |
|
| 515 |
with gr.Row():
|
| 516 |
with gr.Column():
|
| 517 |
context_text = gr.Textbox(
|
| 518 |
+
label="Speaker prompt",
|
| 519 |
placeholder="މަންމަ ކިހާއިރެއް ދަރިފުޅުގެ އިންތިޒާރުގަ އިންނަތާ",
|
| 520 |
value="އައިލީޝް އޭނާއަތަށް ލިބުނީ އެންމެ ނުވަ މަހުގަ",
|
| 521 |
lines=2,
|
| 522 |
elem_classes=["dhivehi-text"]
|
| 523 |
)
|
| 524 |
context_audio = gr.Audio(
|
| 525 |
+
label="Speaker Prompt",
|
| 526 |
type="filepath"
|
| 527 |
)
|
| 528 |
target_text = gr.Textbox(
|
|
|
|
| 574 |
with gr.Accordion("🎵 Audio Style References", open=False):
|
| 575 |
with gr.Row():
|
| 576 |
with gr.Column():
|
| 577 |
+
gr.Markdown("**Speaker A Prompt**")
|
| 578 |
speaker_a_audio = gr.Audio(
|
| 579 |
type="filepath",
|
| 580 |
label="Speaker A Audio Style"
|
| 581 |
)
|
| 582 |
speaker_a_text = gr.Textbox(
|
| 583 |
+
label="Speaker A Prompt Text",
|
| 584 |
lines=2,
|
| 585 |
placeholder="މަންމަ ކިހާއިރެއް ދަރިފުޅުގެ އިންތިޒާރުގަ އިންނަތާ",
|
| 586 |
elem_classes=["dhivehi-text"]
|
| 587 |
)
|
| 588 |
|
| 589 |
with gr.Column():
|
| 590 |
+
gr.Markdown("**Speaker B Prompt**")
|
| 591 |
speaker_b_audio = gr.Audio(
|
| 592 |
type="filepath",
|
| 593 |
+
label="Speaker B Speaker Prompt"
|
| 594 |
)
|
| 595 |
speaker_b_text = gr.Textbox(
|
| 596 |
+
label="Speaker B Speaker Prompt",
|
| 597 |
lines=2,
|
| 598 |
placeholder="މަންމަ ކިހާއިރެއް ދަރިފުޅުގެ އިންތިޒާރުގަ އިންނަތާ",
|
| 599 |
elem_classes=["dhivehi-text"]
|