Use bare except to suppress llama.cpp __del__ errors

parent f9739fe3
...@@ -3650,6 +3650,7 @@ def main(): ...@@ -3650,6 +3650,7 @@ def main():
except ImportError: except ImportError:
# faster-whisper not available, try GGUF with llama.cpp # faster-whisper not available, try GGUF with llama.cpp
print("faster-whisper not available, trying GGUF with llama.cpp...") print("faster-whisper not available, trying GGUF with llama.cpp...")
audio_load_success = False
try: try:
from llama_cpp import Llama from llama_cpp import Llama
...@@ -3668,28 +3669,25 @@ def main(): ...@@ -3668,28 +3669,25 @@ def main():
model_path = download_model(model_to_use, cache_dir) model_path = download_model(model_to_use, cache_dir)
model_to_use = model_path model_to_use = model_path
# Load with llama.cpp (Vulkan) - suppress __del__ errors # Load with llama.cpp (Vulkan)
audio_model = None audio_model = Llama(
try: model_path=model_to_use,
audio_model = Llama( n_gpu_layers=-1, # All layers to GPU
model_path=model_to_use, n_ctx=2048,
n_gpu_layers=-1, # All layers to GPU verbose=False
n_ctx=2048, )
verbose=False
)
except BaseException:
audio_model = None
if audio_model is not None: # Store in multi_model_manager
# Store in multi_model_manager model_key = f"audio:{args.audio_model}"
model_key = f"audio:{args.audio_model}" multi_model_manager.add_model(model_key, audio_model)
multi_model_manager.add_model(model_key, audio_model) print(f"Audio model loaded successfully (GGUF/Vulkan)")
print(f"Audio model loaded successfully (GGUF/Vulkan)") audio_load_success = True
else:
raise Exception("llama.cpp failed to load model")
except Exception as e: except:
print(f"Warning: Could not pre-load audio model: {e}") pass # Ignore all errors, will load on-demand
if not audio_load_success:
print(f"Warning: Could not pre-load audio model (llama.cpp may not support this format)")
print("Audio model will load on-demand when transcription is requested.") print("Audio model will load on-demand when transcription is requested.")
except Exception as e: except Exception as e:
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment