Commit e915006 by voxmenthe · verified · parent: 14caf4a

Upload fine-tuned model, tokenizer, and supporting files for modernbert-imdb-sentiment

Files changed (2)
  1. config.yaml +1 -0
  2. inference.py +83 -35
config.yaml CHANGED
@@ -4,6 +4,7 @@ model:
   max_length: 880 # 256
   dropout: 0.1
   pooling_strategy: "mean" # Current default, change as needed
+  num_weighted_layers: 6 # Match original training config
 
 inference:
   # Default path, can be overridden
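
For orientation: the full config.yaml is not shown in this diff. Below is a minimal sketch of the shape it presumably takes after this change, using only keys that inference.py (next file) actually reads. Every value outside the diffed lines is illustrative, and the repo ids and checkpoint path are assumptions:

    model:
      name_or_path: "voxmenthe/modernbert-imdb-sentiment"    # assumed Hub repo id
      tokenizer_name_or_path: "answerdotai/ModernBERT-base"  # optional; falls back to name_or_path
      base_model_for_config: "answerdotai/ModernBERT-base"   # required by the local .pt loading path
      max_length: 880 # 256
      dropout: 0.1
      pooling_strategy: "mean" # Current default, change as needed
      num_weighted_layers: 6 # Match original training config

    inference:
      # Default path, can be overridden
      model_path: "checkpoints/best_model.pt"  # hypothetical local checkpoint
      max_length: 880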
inference.py CHANGED
@@ -1,58 +1,106 @@
 import torch
 from transformers import AutoTokenizer, AutoModelForSequenceClassification, ModernBertConfig
-# models.py (containing ModernBertForSentiment) will be loaded from the Hub due to trust_remote_code=True
 from typing import Dict, Any
 import yaml
+import os
+from models import ModernBertForSentiment
 
 class SentimentInference:
     def __init__(self, config_path: str = "config.yaml"):
-        """Load configuration and initialize model and tokenizer from Hugging Face Hub."""
+        """Load configuration and initialize model and tokenizer from local checkpoint or Hugging Face Hub."""
+        print(f"--- Debug: SentimentInference __init__ received config_path: {config_path} ---") # Add this
         with open(config_path, 'r') as f:
             config_data = yaml.safe_load(f)
+        print(f"--- Debug: SentimentInference loaded config_data: {config_data} ---") # Add this
 
         model_yaml_cfg = config_data.get('model', {})
         inference_yaml_cfg = config_data.get('inference', {})
 
         model_hf_repo_id = model_yaml_cfg.get('name_or_path')
-        if not model_hf_repo_id:
-            raise ValueError("model.name_or_path must be specified in config.yaml (e.g., 'username/model_name')")
-
         tokenizer_hf_repo_id = model_yaml_cfg.get('tokenizer_name_or_path', model_hf_repo_id)
+        local_model_weights_path = inference_yaml_cfg.get('model_path') # Path for local .pt file
+
+        print(f"--- Debug: model_hf_repo_id: {model_hf_repo_id} ---") # Add this
+        print(f"--- Debug: local_model_weights_path: {local_model_weights_path} ---") # Add this
 
         self.max_length = inference_yaml_cfg.get('max_length', model_yaml_cfg.get('max_length', 512))
 
-        print(f"Loading tokenizer from: {tokenizer_hf_repo_id}")
-        self.tokenizer = AutoTokenizer.from_pretrained(tokenizer_hf_repo_id)
-
-        print(f"Loading base ModernBertConfig from: {model_hf_repo_id}")
-        # Load the config that was uploaded with the model (config.json in the HF repo)
-        # This config should already have the correct architecture defined by ModernBertConfig.
-        # We then augment it with any custom parameters needed by ModernBertForSentiment's __init__.
-        loaded_config = ModernBertConfig.from_pretrained(model_hf_repo_id)
-
-        # Augment loaded_config with parameters from model_yaml_cfg needed for ModernBertForSentiment initialization
-        # These should reflect how the model was trained and its specific custom head.
-        loaded_config.pooling_strategy = model_yaml_cfg.get('pooling_strategy', 'mean') # Default to 'mean' as per your models.py change
-        loaded_config.num_weighted_layers = model_yaml_cfg.get('num_weighted_layers', 4)
-        loaded_config.classifier_dropout = model_yaml_cfg.get('dropout') # Allow None if not in yaml
-        # num_labels should ideally be in the config.json uploaded to HF, but can be set here if needed.
-        # For binary sentiment with a single logit output, num_labels is 1.
-        loaded_config.num_labels = model_yaml_cfg.get('num_labels', 1)
-        # The loss_function might not be strictly needed for inference if the model doesn't use it in forward pass for eval,
-        # but if ModernBertForSentiment.__init__ requires it, it must be provided.
-        # Assuming it's not critical for basic inference here to simplify.
-        # loaded_config.loss_function = model_yaml_cfg.get('loss_function', {'name': '...', 'params': {}})
+        # --- Tokenizer Loading (always from Hub for now, or could be made conditional) ---
+        if not tokenizer_hf_repo_id and not model_hf_repo_id:
+            raise ValueError("Either model.tokenizer_name_or_path or model.name_or_path (as fallback for tokenizer) must be specified in config.yaml")
+        effective_tokenizer_repo_id = tokenizer_hf_repo_id or model_hf_repo_id
+        print(f"Loading tokenizer from: {effective_tokenizer_repo_id}")
+        self.tokenizer = AutoTokenizer.from_pretrained(effective_tokenizer_repo_id)
+
+        # --- Model Loading --- #
+        # Determine if we are loading from a local .pt file or from Hugging Face Hub
+        load_from_local_pt = False
+        if local_model_weights_path and os.path.isfile(local_model_weights_path):
+            print(f"Found local model weights path: {local_model_weights_path}")
+            print(f"--- Debug: Found local model weights path: {local_model_weights_path} ---") # Add this
+            load_from_local_pt = True
+        elif not model_hf_repo_id:
+            raise ValueError("No local model_path found and model.name_or_path (for Hub) is not specified in config.yaml")
+
+        print(f"--- Debug: load_from_local_pt is: {load_from_local_pt} ---") # Add this
 
-        print(f"Instantiating and loading model weights for {model_hf_repo_id}...")
-        # trust_remote_code=True allows loading models.py (containing ModernBertForSentiment)
-        # from the Hugging Face model repository.
-        self.model = AutoModelForSequenceClassification.from_pretrained(
-            model_hf_repo_id,
-            config=loaded_config, # Pass the augmented config
-            trust_remote_code=True
-        )
+        if load_from_local_pt:
+            print("Attempting to load model from local .pt checkpoint...")
+            print("--- Debug: Entering LOCAL .pt loading path ---") # Add this
+            # Base BERT config must still be loaded, usually from a Hub ID (e.g., original base model)
+            # This base_model_for_config_id is crucial for building the correct ModernBertForSentiment structure.
+            base_model_for_config_id = model_yaml_cfg.get('base_model_for_config', model_hf_repo_id or tokenizer_hf_repo_id)
+            print(f"--- Debug: base_model_for_config_id (for local .pt): {base_model_for_config_id} ---") # Add this
+            if not base_model_for_config_id:
+                raise ValueError("For local .pt loading, model.base_model_for_config must be specified in config.yaml (e.g., 'answerdotai/ModernBERT-base') to build the model structure.")
+
+            print(f"Loading ModernBertConfig for structure from: {base_model_for_config_id}")
+            bert_config = ModernBertConfig.from_pretrained(base_model_for_config_id)
+
+            # Augment config with parameters from model_yaml_cfg
+            bert_config.pooling_strategy = model_yaml_cfg.get('pooling_strategy', 'mean')
+            bert_config.num_weighted_layers = model_yaml_cfg.get('num_weighted_layers', 4)
+            bert_config.classifier_dropout = model_yaml_cfg.get('dropout')
+            bert_config.num_labels = model_yaml_cfg.get('num_labels', 1)
+            # bert_config.loss_function = model_yaml_cfg.get('loss_function') # If needed by __init__
+
+            print("Instantiating ModernBertForSentiment model structure...")
+            self.model = ModernBertForSentiment(bert_config)
+
+            print(f"Loading model weights from local checkpoint: {local_model_weights_path}")
+            checkpoint = torch.load(local_model_weights_path, map_location=torch.device('cpu'))
+            if isinstance(checkpoint, dict) and 'model_state_dict' in checkpoint:
+                model_state_to_load = checkpoint['model_state_dict']
+            else:
+                model_state_to_load = checkpoint # Assume it's the state_dict itself
+            self.model.load_state_dict(model_state_to_load)
+            print(f"Model loaded successfully from local checkpoint: {local_model_weights_path}.")
+
+        else: # Load from Hugging Face Hub
+            print(f"Attempting to load model from Hugging Face Hub: {model_hf_repo_id}...")
+            print(f"--- Debug: Entering HUGGING FACE HUB loading path ---") # Add this
+            print(f"--- Debug: model_hf_repo_id (for Hub loading): {model_hf_repo_id} ---") # Add this
+            if not model_hf_repo_id:
+                raise ValueError("model.name_or_path must be specified in config.yaml for Hub loading.")
+
+            print(f"Loading base ModernBertConfig from: {model_hf_repo_id}")
+            loaded_config = ModernBertConfig.from_pretrained(model_hf_repo_id)
+
+            # Augment loaded_config
+            loaded_config.pooling_strategy = model_yaml_cfg.get('pooling_strategy', 'mean')
+            loaded_config.num_weighted_layers = model_yaml_cfg.get('num_weighted_layers', 6) # Default to 6 now
+            loaded_config.classifier_dropout = model_yaml_cfg.get('dropout')
+            loaded_config.num_labels = model_yaml_cfg.get('num_labels', 1)
+
+            print(f"Instantiating and loading model weights for {model_hf_repo_id}...")
+            self.model = AutoModelForSequenceClassification.from_pretrained(
+                model_hf_repo_id,
+                config=loaded_config,
+                trust_remote_code=True
+            )
+            print(f"Model {model_hf_repo_id} loaded successfully from Hugging Face Hub.")
+
         self.model.eval()
-        print(f"Model {model_hf_repo_id} loaded successfully from Hugging Face Hub.")
 
     def predict(self, text: str) -> Dict[str, Any]:
         inputs = self.tokenizer(text, return_tensors="pt", truncation=True, max_length=self.max_length, padding=True)
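
Taken together, the new constructor resolves a tokenizer, chooses between the local-checkpoint and Hub loading paths, and leaves an eval-mode model on self.model. A minimal usage sketch, assuming config.yaml and models.py sit next to inference.py; the exact keys of the dict returned by predict are defined later in the file and are not shown in this diff:

    from inference import SentimentInference

    # Build once (loads tokenizer + weights), then reuse for many predictions.
    sentiment = SentimentInference(config_path="config.yaml")
    result = sentiment.predict("This movie was an absolute delight from start to finish.")
    print(result)  # Dict[str, Any]; see the rest of predict() for the payload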
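
models.py itself is not part of this commit, so the exact ModernBertForSentiment head is not visible here. As background on why num_weighted_layers must match the original training config (the point of both the config.yaml change and the new default of 6 above), a weighted-layer pooling head of the kind these settings suggest is typically a learned softmax mixture over the last N encoder layers. The class and names below are a hypothetical sketch, not the repo's actual implementation:

    import torch
    import torch.nn as nn

    class WeightedLayerPooling(nn.Module):
        """Hypothetical sketch: softmax-weighted mix of the last N hidden-state layers."""
        def __init__(self, num_weighted_layers: int):
            super().__init__()
            # One learnable scalar per pooled layer. The parameter's shape is
            # (num_weighted_layers,), so this value must agree with the checkpoint.
            self.layer_weights = nn.Parameter(torch.zeros(num_weighted_layers))

        def forward(self, all_hidden_states: tuple) -> torch.Tensor:
            # Stack the last N layers: (N, batch, seq_len, hidden)
            stacked = torch.stack(all_hidden_states[-self.layer_weights.numel():], dim=0)
            weights = torch.softmax(self.layer_weights, dim=0).view(-1, 1, 1, 1)
            return (weights * stacked).sum(dim=0)  # (batch, seq_len, hidden)

A checkpoint trained with six weighted layers stores a (6,)-shaped layer_weights tensor, so rebuilding the model with any other value makes load_state_dict fail with a size mismatch; that is what the "Match original training config" comment guards against.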