Add audio generation capabilities to web interface

parent b6d177d8
#!/usr/bin/env python3
import sys
import os
sys.path.insert(0, os.path.dirname(os.path.abspath(__file__)))
from videogen import MODELS, detect_model_type
# Debug helper: find the "wan2_2_i2v_a14b" entry in the MODELS registry and
# print selected fields next to what detect_model_type() reports for it.
for name, info in MODELS.items():
    if name == "wan2_2_i2v_a14b":
        print("Name:", name)
        print("ID:", info.get("id"))
        print("Class:", info.get("class"))
        print("Supports I2V:", info.get("supports_i2v"))
        print("Tags:", info.get("tags"))
        # Show the detector's view of the same entry for comparison.
        print("Capabilities:", detect_model_type(info))
......@@ -261,26 +261,26 @@ def build_command(params: Dict) -> List[str]:
# Audio options
if params.get('generate_audio'):
cmd.append('--generate-audio')
cmd.append('--generate_audio')
if params.get('audio_type'):
cmd.extend(['--audio-type', params['audio_type']])
cmd.extend(['--audio_type', params['audio_type']])
# Use appropriate text/prompt based on audio type
if params.get('audio_type') == 'music' and params.get('music_prompt'):
cmd.extend(['--audio-text', params['music_prompt']])
cmd.extend(['--audio_text', params['music_prompt']])
elif params.get('audio_text'):
cmd.extend(['--audio-text', params['audio_text']])
cmd.extend(['--audio_text', params['audio_text']])
if params.get('tts_voice'):
cmd.extend(['--tts-voice', params['tts_voice']])
cmd.extend(['--tts_voice', params['tts_voice']])
if params.get('sync_audio'):
cmd.append('--sync-audio')
cmd.append('--sync_audio')
if params.get('audio_sync_mode'):
cmd.extend(['--audio-sync-mode', params['audio_sync_mode']])
cmd.extend(['--sync_mode', params['audio_sync_mode']])
if params.get('lip_sync'):
cmd.append('--lip-sync')
cmd.append('--lip_sync')
if params.get('lip_sync_method'):
cmd.extend(['--lip-sync-method', params['lip_sync_method']])
cmd.extend(['--lip_sync_method', params['lip_sync_method']])
# Dubbing/Translation
if params.get('dub_video'):
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment