Update codai/models/utils.py with full implementations

- Added complete check_hf_chat_template with global_args support - Added complete get_resolved_model_name - Added complete get_model_family with more model families - Added complete get_reasoning_stop_tokens for more model families - Added complete get_reasoning_system_prompt - Added set_global_args and get_global_args for configuration

Update codai/models/utils.py with full implementations
- Added complete check_hf_chat_template with global_args support - Added complete get_resolved_model_name - Added complete get_model_family with more model families - Added complete get_reasoning_stop_tokens for more model families - Added complete get_reasoning_system_prompt - Added set_global_args and get_global_args for configuration
9299c34f · Your Name · add2ecd1 · 9299c34f
Commit 9299c34f authored Mar 17, 2026 by Your Name
Show whitespace changes
Inline Side-by-side

Showing with 173 additions and 7 deletions

utils.py codai/models/utils.py +173 -7

No files found.
--- a/codai/models/utils.py
+++ b/codai/models/utils.py
 """Utility functions for model handling."""

-from typing import Optional
+from typing import Optional, Any
+
+
+# Global args - can be set by the application
+_global_args = None
+
+
+def set_global_args(args: Any):
+    """Set the global arguments object for use in utility functions."""
+    global _global_args
+    _global_args = args
+
+
+def get_global_args():
+    """Get the global arguments object."""
+    global _global_args
+    return _global_args


 def check_hf_chat_template(model_type: str = "text", model_name: str = None) -> tuple:
-    """Check if a model supports HF chat template."""
-    return (True, "chatml")
+    """
+    Check if HuggingFace chat template should be used for the model.
+    Returns a tuple (should_use, template_name) where template_name is the template to use or None for auto-detect.
+    
+    Args:
+        model_type: The model type ('text', 'image', etc.)
+        model_name: The specific model name (optional)
+    
+    Returns:
+        Tuple of (should_use: bool, template_name: str or None)
+        template_name is None means auto-detect from tokenizer
+    
+    Examples:
+        # Auto-detect and apply to all models
+        --hf-chat-template auto
+        
+        # Apply to all text models with auto-detect
+        --hf-chat-template text
+        
+        # Apply to specific model with auto-detect
+        --hf-chat-template text:llama-3.1
+        
+        # Apply to specific model with specific template
+        --hf-chat-template "llama-3.1:llama3"
+        --hf-chat-template "phi-3:chatml"
+    """
+    global_args = get_global_args()
+    hf_chat_template = getattr(global_args, 'hf_chat_template', []) if global_args else []
+    
+    # If empty list, HF chat template is not enabled
+    if not hf_chat_template:
+        return (False, None)
+    
+    for spec in hf_chat_template:
+        # Handle auto-detect - try to load HF tokenizer and auto-detect template
+        if spec == 'auto' or spec == '':
+            # Applies to all models when using 'auto'
+            return (True, None)
+        
+        # Check if this spec has a template specified after the model name
+        # Format: "model_name:template_name" or "type:model_name:template_name"
+        parts = spec.split(':')
+        
+        if len(parts) == 1:
+            # Just a type or single value
+            spec_val = parts[0]
+            if spec_val == model_type or spec_val == '*':
+                return (True, None)
+            # Check if it matches the model name directly (when model_type is part of the name)
+            if model_name and (spec_val in model_name or model_name in spec_val):
+                return (True, None)
+        elif len(parts) == 2:
+            # Format: "type:model_name" or "model_name:template"
+            spec_type = parts[0]
+            spec_model = parts[1]
+            
+            # Check if it's "text" or "image" type
+            if spec_type in ('text', 'image', '*'):
+                if spec_type == model_type or spec_type == '*':
+                    # Check if model name matches
+                    if spec_model == model_name or spec_model == '*':
+                        return (True, None)
+            else:
+                # It's "model_name:template" format
+                if model_name and (spec_model in model_name or model_name in spec_model):
+                    return (True, spec_type)  # spec_type is actually the template!
+        elif len(parts) == 3:
+            # Format: "type:model_name:template"
+            spec_type = parts[0]
+            spec_model = parts[1]
+            spec_template = parts[2]
+            
+            if spec_type == model_type or spec_type == '*':
+                if spec_model == model_name or spec_model == '*':
+                    return (True, spec_template)
+    
+    return (False, None)


 def get_resolved_model_name(requested_model: str, current_manager = None) -> str:
-    """Get the resolved model name."""
+    """
+    Get the actual model name to return in the response.
+    
+    Handles aliases and ensures the correct model identifier is returned.
+    """
+    global_args = get_global_args()
+    
+    # Get model aliases from args if available
+    model_aliases = getattr(global_args, 'model_aliases', {}) if global_args else {}
+    
+    # If it's an alias, return the resolved name
+    if requested_model in model_aliases:
+        return model_aliases[requested_model]
+    
+    # Try to get from current manager if available
+    if current_manager is not None:
+        # Check if the model is loaded in the manager
+        if hasattr(current_manager, 'models'):
+            for key, model in current_manager.models.items():
+                if requested_model == key or requested_model in key:
+                    return key
+        if hasattr(current_manager, 'default_model'):
+            if requested_model == "default":
+                return current_manager.default_model
+    
+    # Check if it's a HuggingFace model ID - if so, return as-is
+    if '/' in requested_model:
+        return requested_model
+    
+    # Check if it's a URL - return as-is
+    if requested_model.startswith('http://') or requested_model.startswith('https://'):
+        return requested_model
+    
+    # Otherwise return as-is
    return requested_model


 def get_model_family(model_name: str) -> str:
    """Detect model family from model name."""
+    if not model_name:
+        return 'generic'
+    
    model_lower = model_name.lower()
+    
+    # Check for reasoning models first
+    if 'reasoning' in model_lower or 'deepseek-r1' in model_lower:
+        return 'deepseek'
+    
    if 'qwen' in model_lower:
+        if 'qwen3' in model_lower or 'qwen3.5' in model_lower:
+            return 'qwen3'
+        elif 'qwen2' in model_lower:
+            return 'qwen2'
        return 'qwen'
    if 'llama' in model_lower:
+        if 'llama4' in model_lower:
+            return 'llama4'
+        elif 'llama3' in model_lower:
+            return 'llama3'
        return 'llama'
-    if 'mistral' in model_lower:
+    if 'mistral' in model_lower or 'mixtral' in model_lower:
        return 'mistral'
    if 'deepseek' in model_lower:
        return 'deepseek'
@@ -30,6 +170,10 @@ def get_model_family(model_name: str) -> str:
        return 'yi'
    if 'hermes' in model_lower:
        return 'hermes'
+    if 'phi' in model_lower:
+        return 'phi'
+    if 'command-r' in model_lower:
+        return 'command-r'
    return 'generic'


@@ -38,7 +182,13 @@ def get_reasoning_stop_tokens(model_family: str) -> tuple:
    
    Returns tuple of (start_token, end_token, additional_stops)
    """
-    if model_family == 'qwen':
+    if model_family == 'qwen3':
+        return (
+            "<|im_start|>assistant\n",
+            "<|im_end|>",
+            ["<|im_end|>", "<|endoftext|>", "<|im_start|>"]
+        )
+    elif model_family == 'qwen2' or model_family == 'qwen':
        return (
            "<|im_start|>assistant\n",
            "<|im_end|>",
@@ -80,6 +230,18 @@ def get_reasoning_stop_tokens(model_family: str) -> tuple:
            "<|im_end|>",
            ["<|im_end|>", "<|endoftext|>"]
        )
+    elif model_family == 'phi':
+        return (
+            "<|assistant|>\n",
+            "<|end|>",
+            ["<|end|>", "<|endoftext|>", "<|user|>", "<|system|>"]
+        )
+    elif model_family == 'command-r':
+        return (
+            "<|start|>assistant\n",
+            "<|end|>",
+            ["<|end|>", "<|endoftext|>", "<|start|>"]
+        )
    else:
        # Default fallback - try common tokens
        return (
@@ -92,7 +254,7 @@ def get_reasoning_stop_tokens(model_family: str) -> tuple:
 def get_reasoning_system_prompt(model_family: str) -> str:
    """Get system prompt injection for forcing reasoning on non-native models."""
    
-    if model_family == 'qwen':
+    if model_family in ('qwen3', 'qwen2', 'qwen'):
        return "You must reason step-by-step inside <thought> tags before every response."
    elif model_family == 'deepseek':
        return "You must reason step-by-step inside <thought> tags before every response."
@@ -104,5 +266,9 @@ def get_reasoning_system_prompt(model_family: str) -> str:
        return "You must reason step-by-step inside <thought> tags before every response. Use <start_of_turn>model for your response."
    elif model_family in ('yi', 'hermes'):
        return "You must reason step-by-step inside <|im_start|>assistant tags before every response."
+    elif model_family == 'phi':
+        return "You must reason step-by-step inside <|assistant> tags before every response."
+    elif model_family == 'command-r':
+        return "You must reason step-by-step before every response."
    else:
        return "You must reason step-by-step before every response."