Spaces:

Dewiin
/

voice_clone

Running

Devin Xie committed on Nov 4, 2024

Commit

d0b52af

•

1 Parent(s): a2f1abf

added sample inputs

Files changed (5) hide show

.gitignore CHANGED Viewed

app.py CHANGED Viewed

@@ -28,14 +28,21 @@ def main():
   title = f"""<h2 align="center" style="font-size: 1.2rem; margin-bottom: 2rem;">Make your favorite characters say anything!</h2>"""
   st.markdown(title, unsafe_allow_html=True)
   # Upload audio file
   uploaded_file = st.file_uploader('Add an audio file of the voice you want to clone...', type=['wav'])
-  if uploaded_file is not None:
-    reference_audio, synthesized_audio = st.columns(2)
-    with reference_audio:
-      st.header('Reference Audio')
-      st.audio(uploaded_file, format='audio/wav')
     # Input text
     text_input = st.text_input('What do you want your character to say? (Alphabet letters only, DO NOT INCLUDE PUNCTUATION)')
@@ -44,11 +51,10 @@ def main():
       if text_input:
         try:
           with st.spinner('Synthesizing...'):
-            output_path = generate_audio(uploaded_file, text_input)
-          with synthesized_audio:
-            st.header('Synthesized Audio')
-            st.audio(output_path, format='audio/wav')
         except:
           st.error('There was an issue synthesizing the text. Please check the input and try again. Remember, do not include punctuation.')
       else:

   title = f"""<h2 align="center" style="font-size: 1.2rem; margin-bottom: 2rem;">Make your favorite characters say anything!</h2>"""
   st.markdown(title, unsafe_allow_html=True)
+  sample_files = {
+    'Stewie Griffin': 'sample_inputs/stewie.wav',
+    'Donald Trump': 'sample_inputs/trump.wav',
+    'Joe Rogan': 'sample_inputs/rogan.wav'
+  }
   # Upload audio file
   uploaded_file = st.file_uploader('Add an audio file of the voice you want to clone...', type=['wav'])
+  selected_sample = st.selectbox('Or choose a sample:', list(sample_files.keys()))
+  speaker_file = sample_files[selected_sample] if uploaded_file is None else uploaded_file
+  if speaker_file:
+    st.header('Reference Audio')
+    st.audio(uploaded_file, format='audio/wav')
     # Input text
     text_input = st.text_input('What do you want your character to say? (Alphabet letters only, DO NOT INCLUDE PUNCTUATION)')
       if text_input:
         try:
           with st.spinner('Synthesizing...'):
+            output_path = generate_audio(speaker_file, text_input)
+          st.header('Synthesized Audio')
+          st.audio(output_path, format='audio/wav')
         except:
           st.error('There was an issue synthesizing the text. Please check the input and try again. Remember, do not include punctuation.')
       else:

sample_inputs/rogan.wav ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:7443710c741b5716007a7e89e0c9448779c23adbce258e78c84615dc0f7bd6d0
+size 8559872

sample_inputs/stewie.wav ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:8559147ae1b5ac2b7925365e42604d05764fd812a214bdcc60d1169f67b380e0
+size 5667310

sample_inputs/trump.wav ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:235b7d7b4d40d0a80808644964a5f01dbca68ebc7043a61f03661cebe9061437
+size 8698620