Added Early Config Module and a New Approach for Displaying Model Download Progress Bars

UtkarshTheDev · UtkarshTheDev · commit c3a0a92112be · 2025-05-16T20:30:13.000+05:30
diff --git a/CHANGELOG.md b/CHANGELOG.md
@@ -2,6 +2,20 @@
 
 All notable changes to LocalLab will be documented in this file.
 
+## [0.6.4] - 2025-05-16
+
+### Improved
+
+- Completely redesigned model downloading experience with proper native Hugging Face progress bars
+- Created new early configuration system to set up logging before any Hugging Face libraries are imported
+- Implemented StdoutRedirector to ensure proper display of progress bars during model downloads
+- Temporarily disabled all logging handlers during model downloads to prevent interference
+- Added clear visual separation between LocalLab logs and Hugging Face progress bars
+- Set environment variables to optimize Hugging Face download experience
+- Configured transformers library to use native progress bars for model downloads
+- Added informative messages before and after model downloads for better user experience
+- Ensured consistent progress bar display across different model types and sizes
+
 ## [0.6.3] - 2025-05-16
 
 ### Improved
@@ -12,9 +26,6 @@ All notable changes to LocalLab will be documented in this file.
 - Improved configuration of Hugging Face Hub progress bars for better visual experience
 - Completely bypassed custom logging for Hugging Face download-related logs
 - Configured transformers library to use native progress bars for model downloads
-- Disabled logger propagation for HuggingFace-related modules during downloads
-- Added proper spacing before and after progress bars for better readability
-- Enhanced progress bar detection to catch all download-related progress indicators
 
 ## [0.6.2] - 2025-05-04
 
diff --git a/locallab/__init__.py b/locallab/__init__.py
@@ -2,14 +2,21 @@
 LocalLab - A lightweight AI inference server for running LLMs locally
 """
 
-__version__ = "0.6.3"  # Updated to improve model downloading experience and fix CLI settings
+# Import early configuration first to set up logging and environment variables
+# This ensures Hugging Face's progress bars are displayed correctly
+from .utils.early_config import enable_hf_progress_bars
+
+__version__ = "0.6.4"  # Updated to improve model downloading experience and fix CLI settings
 
 # Only import what's necessary initially, lazy-load the rest
 from .logger import get_logger
 
 # Explicitly expose start_server for direct import
 from .server import start_server, cli
 
+# Enable Hugging Face progress bars with native display
+enable_hf_progress_bars()
+
 # Other imports will be lazy-loaded when needed
 # from .config import MODEL_REGISTRY, DEFAULT_MODEL
 # from .model_manager import ModelManager
diff --git a/locallab/model_manager.py b/locallab/model_manager.py
@@ -1,8 +1,11 @@
+# Import early configuration module first to set up logging and environment variables
+# This ensures Hugging Face's progress bars are displayed correctly
+from .utils.early_config import enable_hf_progress_bars, StdoutRedirector
+
 from .config import HF_TOKEN_ENV, get_env_var, set_env_var
 import os
 import logging
 import torch
-from transformers import AutoTokenizer, AutoModelForCausalLM, BitsAndBytesConfig
 from typing import Optional, Generator, Dict, Any, List, Union, Callable, AsyncGenerator
 from fastapi import HTTPException
 import time
@@ -13,7 +16,6 @@
 )
 from .logger.logger import logger, log_model_loaded, log_model_unloaded
 from .utils import check_resource_availability, get_device, format_model_size
-from .utils.progress import configure_hf_hub_progress
 import gc
 from colorama import Fore, Style
 import asyncio
@@ -22,20 +24,12 @@
 import tempfile
 import json
 
-# Configure HuggingFace Hub progress bars to use native display
+# Enable Hugging Face progress bars with native display
 # This ensures we see the visually appealing progress bars from HuggingFace
-configure_hf_hub_progress()
-
-# Also configure transformers to use HuggingFace Hub's progress bars
-try:
-    import transformers
-    transformers.utils.logging.enable_progress_bar()
-    # Set transformers logging to only show warnings and errors
-    transformers.logging.set_verbosity_warning()
-except ImportError:
-    logger.debug("Could not configure transformers progress bars")
-except Exception as e:
-    logger.debug(f"Error configuring transformers progress bars: {str(e)}")
+enable_hf_progress_bars()
+
+# Import transformers after configuring logging to ensure proper display
+from transformers import AutoTokenizer, AutoModelForCausalLM, BitsAndBytesConfig
 
 QUANTIZATION_SETTINGS = {
     "fp16": {
@@ -280,52 +274,41 @@ async def _load_model_with_optimizations(self, model_id: str):
             # Add an empty line to separate from HuggingFace progress bars
             print("")
 
-            # Set a flag to indicate we're downloading a model
-            # This will help our logger know to let HuggingFace's progress bars through
-            try:
-                # Access the module's global variable
-                import locallab.utils.progress
-                locallab.utils.progress.is_downloading = True
-
-                # Ensure HuggingFace Hub's progress bars are enabled
-                from huggingface_hub.utils import logging as hf_logging
-                hf_logging.enable_progress_bars()
-
-                # Configure transformers to use progress bars
-                import transformers
-                transformers.utils.logging.enable_progress_bar()
-
-                # Also ensure tqdm is properly configured for nice display
-                import tqdm
-                tqdm.tqdm.monitor_interval = 0  # Disable monitor thread which can cause issues
+            # Announce the download, padded with blank lines, before progress bars start
+            print(f"\n{Fore.CYAN}Starting model download - native progress bars will appear below{Style.RESET_ALL}\n")
+
+            # Enable Hugging Face progress bars again to ensure they're properly configured
+            enable_hf_progress_bars()
+
+            # Use a context manager to ensure proper display of Hugging Face progress bars
+            with StdoutRedirector(disable_logging=True):
+                # Load tokenizer first
+                logger.info(f"Loading tokenizer for {model_id}...")
+                self.tokenizer = AutoTokenizer.from_pretrained(
+                    model_id,
+                    token=hf_token if hf_token else None
+                )
+                logger.info(f"Tokenizer loaded successfully")
 
-                # Temporarily disable our custom logger for HuggingFace logs
-                import logging
-                for logger_name in ['tqdm', 'huggingface_hub', 'transformers', 'filelock']:
-                    logging.getLogger(logger_name).handlers = []  # Remove any handlers
-                    logging.getLogger(logger_name).propagate = False  # Don't propagate to parent loggers
-            except:
-                # Fallback if import fails
-                pass
+                # Load model with optimizations
+                logger.info(f"Loading model weights for {model_id}...")
 
-            # Add an empty line before progress bars start
-            print("\n")
+                # This is the critical part where we want to see nice progress bars
+                # We'll temporarily disable our logger's handlers to prevent interference
+                root_logger = logging.getLogger()
+                original_handlers = root_logger.handlers.copy()
+                root_logger.handlers = []
 
-            # Load tokenizer first
-            logger.info(f"Loading tokenizer for {model_id}...")
-            self.tokenizer = AutoTokenizer.from_pretrained(
-                model_id,
-                token=hf_token if hf_token else None
-            )
-            logger.info(f"Tokenizer loaded successfully")
-
-            # Load model with optimizations
-            logger.info(f"Loading model weights for {model_id}...")
-            self.model = AutoModelForCausalLM.from_pretrained(
-                model_id,
-                token=hf_token if hf_token else None,
-                **quant_config
-            )
+                try:
+                    # Load the model with Hugging Face's native progress bars
+                    self.model = AutoModelForCausalLM.from_pretrained(
+                        model_id,
+                        token=hf_token if hf_token else None,
+                        **quant_config
+                    )
+                finally:
+                    # Restore our logger's handlers
+                    root_logger.handlers = original_handlers
             # Reset the downloading flag
             try:
                 # Access the module's global variable
@@ -1106,47 +1089,41 @@ async def load_custom_model(self, model_name: str, fallback_model: Optional[str]
             # Add an empty line to separate from HuggingFace progress bars
             print("")
 
-            # Set a flag to indicate we're downloading a model
-            try:
-                # Access the module's global variable
-                import locallab.utils.progress
-                locallab.utils.progress.is_downloading = True
-
-                # Ensure HuggingFace Hub's progress bars are enabled
-                from huggingface_hub.utils import logging as hf_logging
-                hf_logging.enable_progress_bars()
+            # Announce the download, padded with blank lines, before progress bars start
+            print(f"\n{Fore.CYAN}Starting custom model download - native progress bars will appear below{Style.RESET_ALL}\n")
 
-                # Configure transformers to use progress bars
-                import transformers
-                transformers.utils.logging.enable_progress_bar()
+            # Enable Hugging Face progress bars again to ensure they're properly configured
+            enable_hf_progress_bars()
 
-                # Also ensure tqdm is properly configured for nice display
-                import tqdm
-                tqdm.tqdm.monitor_interval = 0  # Disable monitor thread which can cause issues
+            # Use a context manager to ensure proper display of Hugging Face progress bars
+            with StdoutRedirector(disable_logging=True):
+                # Load tokenizer first
+                logger.info(f"Loading tokenizer for custom model {model_name}...")
 
-                # Temporarily disable our custom logger for HuggingFace logs
-                import logging
-                for logger_name in ['tqdm', 'huggingface_hub', 'transformers', 'filelock']:
-                    logging.getLogger(logger_name).handlers = []  # Remove any handlers
-                    logging.getLogger(logger_name).propagate = False  # Don't propagate to parent loggers
-            except:
-                # Fallback if import fails
-                pass
+                # This is the critical part where we want to see nice progress bars
+                # We'll temporarily disable our logger's handlers to prevent interference
+                root_logger = logging.getLogger()
+                original_handlers = root_logger.handlers.copy()
+                root_logger.handlers = []
 
-            # Add an empty line before progress bars start
-            print("\n")
-
-            self.tokenizer = AutoTokenizer.from_pretrained(model_name)
-            logger.info(f"Tokenizer loaded successfully")
-
-            # Load model with optimizations
-            logger.info(f"Loading model weights for custom model {model_name}...")
-            self.model = AutoModelForCausalLM.from_pretrained(
-                model_name,
-                torch_dtype=torch.float16,
-                device_map="auto",
-                quantization_config=quant_config
-            )
+                try:
+                    # Load tokenizer with Hugging Face's native progress bars
+                    self.tokenizer = AutoTokenizer.from_pretrained(model_name)
+                    logger.info(f"Tokenizer loaded successfully")
+
+                    # Load model with optimizations
+                    logger.info(f"Loading model weights for custom model {model_name}...")
+
+                    # Load the model with Hugging Face's native progress bars
+                    self.model = AutoModelForCausalLM.from_pretrained(
+                        model_name,
+                        torch_dtype=torch.float16,
+                        device_map="auto",
+                        quantization_config=quant_config
+                    )
+                finally:
+                    # Restore our logger's handlers
+                    root_logger.handlers = original_handlers
             # Reset the downloading flag
             try:
                 # Access the module's global variable
diff --git a/locallab/utils/early_config.py b/locallab/utils/early_config.py
@@ -0,0 +1,100 @@
+"""
+Early configuration module for LocalLab.
+This module is imported before any other modules to configure logging and environment variables.
+"""
+
+import os
+import sys
+import logging
+import warnings
+
+# Environment flags for the Hugging Face stack and tqdm
+import importlib.util
+if importlib.util.find_spec("hf_transfer") is not None:  # Flag without the package makes hub downloads raise
+    os.environ["HF_HUB_ENABLE_HF_TRANSFER"] = "1"  # Enable HF Transfer for better downloads
+os.environ["TOKENIZERS_PARALLELISM"] = "true"  # Enable parallelism for tokenizers
+os.environ["TRANSFORMERS_NO_ADVISORY_WARNINGS"] = "1"  # Disable advisory warnings
+os.environ["HF_HUB_DISABLE_TELEMETRY"] = "1"  # Disable telemetry
+os.environ.pop("TQDM_DISABLE", None)  # Unset, not "0": tqdm may treat any non-empty value as true - TODO confirm
+os.environ["TQDM_MININTERVAL"] = "0.1"  # Update progress bars more frequently
+
+# Hugging Face logger setup, intended to run before any HF library is imported
+def configure_hf_logging():
+    """
+    Quiet the loggers of the Hugging Face stack and silence Python warnings.
+
+    Each listed logger is set to WARNING, detached from its parent loggers,
+    stripped of its handlers and left with a single NullHandler.
+    """
+    # Suppress everything reported through the warnings module
+    warnings.filterwarnings("ignore")
+
+    quiet_names = ("transformers", "huggingface_hub", "accelerate", "tqdm", "filelock")
+    for name in quiet_names:
+        target = logging.getLogger(name)
+        target.setLevel(logging.WARNING)  # Only warnings and errors pass
+        target.propagate = False  # Keep records away from ancestor loggers
+
+        # Detach whatever is attached; iterate over a snapshot while removing
+        for attached in list(target.handlers):
+            target.removeHandler(attached)
+        target.addHandler(logging.NullHandler())  # Avoids "no handlers" warnings
+
+# Apply the logger setup as an import-time side effect
+configure_hf_logging()
+
+# Context manager that quiets Hugging Face loggers while a model is downloading
+class StdoutRedirector:
+    """
+    Context manager that sets the Hugging Face-related loggers to WARNING for the
+    duration of the block; sys.stdout/sys.stderr are recorded but not replaced.
+    """
+    def __init__(self, disable_logging=True):
+        self.disable_logging = disable_logging
+        # Streams as they were when the instance was created
+        self.original_stdout, self.original_stderr = sys.stdout, sys.stderr
+        self.original_log_levels = {}
+
+    def __enter__(self):
+        if not self.disable_logging:
+            return self
+        # Remember each logger's current level, then set it to WARNING
+        for name in ("transformers", "huggingface_hub", "accelerate", "tqdm", "filelock"):
+            target = logging.getLogger(name)
+            self.original_log_levels[name] = target.level
+            target.setLevel(logging.WARNING)
+        return self
+
+    def __exit__(self, exc_type, exc_val, exc_tb):
+        # Put back the levels captured in __enter__ (nothing to do when disabled)
+        saved = self.original_log_levels if self.disable_logging else {}
+        for name in saved:
+            logging.getLogger(name).setLevel(saved[name])
+
+# Best-effort switch that turns on the native Hugging Face progress bars
+def enable_hf_progress_bars():
+    """
+    Enable Hugging Face progress bars.
+    Call this function before downloading models; libraries that are missing
+    (or lack the expected API) are skipped instead of raising.
+    """
+    try:
+        import tqdm
+        tqdm.tqdm.monitor_interval = 0  # Disable monitor thread
+    except ImportError:
+        pass
+
+    # huggingface_hub documents this toggle under huggingface_hub.utils
+    try:
+        from huggingface_hub.utils import enable_progress_bars
+        enable_progress_bars()
+    except (ImportError, AttributeError):
+        pass
+
+    # transformers: enable its progress bar and set log verbosity to warning
+    try:
+        import transformers
+        transformers.utils.logging.enable_progress_bar()
+        transformers.logging.set_verbosity_warning()
+    except (ImportError, AttributeError):
+        pass
diff --git a/setup.py b/setup.py
@@ -47,7 +47,7 @@
 
 setup(
     name="locallab",
-    version="0.6.3",
+    version="0.6.4",
     packages=find_packages(include=["locallab", "locallab.*"]),
     install_requires=install_requires,
     extras_require={