Spaces:

playmak3r
/

Vibevoice-1.5B

Running

App Files Files Community

playmak3r committed on Oct 20

Commit

1e4e16f

1 Parent(s): b1c3b85

refactor: use class attributes for voices and examples directories in VibeVoiceDemo

Browse files

Files changed (1) hide show

model.py +23 -24

model.py CHANGED Viewed

@@ -31,6 +31,9 @@ def convert_to_16_bit_wav(data):
     return data
 class VibeVoiceDemo:
     def __init__(self, model_path: str, device: str = "cuda", inference_steps: int = 5, adapter_path: Optional[str] = None):
         """Initialize the VibeVoice demo with model loading."""
         self.model_path = model_path
@@ -148,43 +151,40 @@ class VibeVoiceDemo:
     def setup_voice_presets(self):
         """Setup voice presets by scanning the voices directory."""
-        voices_dir = os.path.join(os.path.dirname(__file__), "voices")
         # Check if voices directory exists
-        if not os.path.exists(voices_dir):
-            print(f"Warning: Voices directory not found at {voices_dir}")
             self.voice_presets = {}
             self.available_voices = {}
             return
         # Scan for all WAV files in the voices directory
         self.voice_presets = {}
         # Get all .wav files in the voices directory
-        wav_files = [f for f in os.listdir(voices_dir)
-                    if f.lower().endswith(('.wav', '.mp3', '.flac', '.ogg', '.m4a', '.aac')) and os.path.isfile(os.path.join(voices_dir, f))]
         # Create dictionary with filename (without extension) as key
         for wav_file in wav_files:
             # Remove .wav extension to get the name
             name = os.path.splitext(wav_file)[0]
-            # Create full path
-            full_path = os.path.join(voices_dir, wav_file)
             self.voice_presets[name] = full_path
         # Sort the voice presets alphabetically by name for better UI
         self.voice_presets = dict(sorted(self.voice_presets.items()))
         # Filter out voices that don't exist (this is now redundant but kept for safety)
         self.available_voices = {
             name: path for name, path in self.voice_presets.items()
             if os.path.exists(path)
         }
         if not self.available_voices:
             raise gr.Error("No voice presets found. Please add .wav files to the demo/voices directory.")
-        print(f"Found {len(self.available_voices)} voice files in {voices_dir}")
         print(f"Available voices: {', '.join(self.available_voices.keys())}")
     def read_audio(self, audio_path: str, target_sr: int = 24000) -> np.ndarray:
@@ -537,13 +537,13 @@ class VibeVoiceDemo:
                 refresh_negative=True,
                 is_prefill=voice_cloning_enabled,
             )
         except Exception as e:
             print(f"Error in generation thread: {e}")
             traceback.print_exc()
             # Make sure to end the stream on error
             audio_streamer.end()
     def stop_audio_generation(self):
         """Stop the current audio generation process."""
         self.stop_generation = True
@@ -553,23 +553,22 @@ class VibeVoiceDemo:
             except Exception as e:
                 print(f"Error stopping streamer: {e}")
         print("🛑 Audio generation stop requested")
     def load_example_scripts(self):
         """Load example scripts from the text_examples directory."""
-        examples_dir = os.path.join(os.path.dirname(__file__), "text_examples")
         self.example_scripts = []
         # Check if text_examples directory exists
-        if not os.path.exists(examples_dir):
-            print(f"Warning: text_examples directory not found at {examples_dir}")
             return
         # Get all .txt files in the text_examples directory
-        txt_files = sorted([f for f in os.listdir(examples_dir)
-                          if f.lower().endswith('.txt') and os.path.isfile(os.path.join(examples_dir, f))])
         for txt_file in txt_files:
-            file_path = os.path.join(examples_dir, txt_file)
             import re
             # Check if filename contains a time pattern like "45min", "90min", etc.

     return data
 class VibeVoiceDemo:
+    voices_dir = os.path.join(os.path.dirname(__file__), "voices")
+    examples_dir = os.path.join(os.path.dirname(__file__), "text_examples")
     def __init__(self, model_path: str, device: str = "cuda", inference_steps: int = 5, adapter_path: Optional[str] = None):
         """Initialize the VibeVoice demo with model loading."""
         self.model_path = model_path
     def setup_voice_presets(self):
         """Setup voice presets by scanning the voices directory."""
         # Check if voices directory exists
+        if not os.path.exists(self.voices_dir):
+            print(f"Warning: Voices directory not found at {self.voices_dir}")
             self.voice_presets = {}
             self.available_voices = {}
             return
         # Scan for all WAV files in the voices directory
         self.voice_presets = {}
         # Get all .wav files in the voices directory
+        wav_files = [f for f in os.listdir(self.voices_dir)
+                    if f.lower().endswith(('.wav', '.mp3', '.flac', '.ogg', '.m4a', '.aac')) and os.path.isfile(os.path.join(self.voices_dir, f))]
         # Create dictionary with filename (without extension) as key
         for wav_file in wav_files:
             # Remove .wav extension to get the name
             name = os.path.splitext(wav_file)[0]
+            full_path = os.path.join(self.voices_dir, wav_file)
             self.voice_presets[name] = full_path
         # Sort the voice presets alphabetically by name for better UI
         self.voice_presets = dict(sorted(self.voice_presets.items()))
         # Filter out voices that don't exist (this is now redundant but kept for safety)
         self.available_voices = {
             name: path for name, path in self.voice_presets.items()
             if os.path.exists(path)
         }
         if not self.available_voices:
             raise gr.Error("No voice presets found. Please add .wav files to the demo/voices directory.")
+        print(f"Found {len(self.available_voices)} voice files in {self.voices_dir}")
         print(f"Available voices: {', '.join(self.available_voices.keys())}")
     def read_audio(self, audio_path: str, target_sr: int = 24000) -> np.ndarray:
                 refresh_negative=True,
                 is_prefill=voice_cloning_enabled,
             )
         except Exception as e:
             print(f"Error in generation thread: {e}")
             traceback.print_exc()
             # Make sure to end the stream on error
             audio_streamer.end()
     def stop_audio_generation(self):
         """Stop the current audio generation process."""
         self.stop_generation = True
             except Exception as e:
                 print(f"Error stopping streamer: {e}")
         print("🛑 Audio generation stop requested")
     def load_example_scripts(self):
         """Load example scripts from the text_examples directory."""
         self.example_scripts = []
         # Check if text_examples directory exists
+        if not os.path.exists(self.examples_dir):
+            print(f"Warning: text_examples directory not found at {self.examples_dir}")
             return
         # Get all .txt files in the text_examples directory
+        txt_files = sorted([f for f in os.listdir(self.examples_dir)
+                          if f.lower().endswith('.txt') and os.path.isfile(os.path.join(self.examples_dir, f))])
         for txt_file in txt_files:
+            file_path = os.path.join(self.examples_dir, txt_file)
             import re
             # Check if filename contains a time pattern like "45min", "90min", etc.