abhilash88
/

age-gender-prediction

@@ -1,8 +1,8 @@
 """
-Age-Gender Prediction Model with Working One-Liner Pipeline
-Based on Hugging Face official documentation and best practices
-Usage:
 from transformers import pipeline
 classifier = pipeline("image-classification", model="abhilash88/age-gender-prediction", trust_remote_code=True)
 result = classifier("image.jpg")
@@ -14,131 +14,91 @@ import torch.nn as nn
 from transformers import (
     ViTModel,
     ViTImageProcessor,
-    PreTrainedModel,
-    PretrainedConfig,
-    ImageClassificationPipeline,
-    Pipeline
 )
 from PIL import Image
 import numpy as np
-class AgeGenderConfig(PretrainedConfig):
-    """Configuration class following HuggingFace standards"""
     # NOTE(review): every line of this class carries a "-" diff marker, i.e. it
     # belongs to the pre-change version of the file shown in this diff view.
-    model_type = "age-gender-vit"
-    def __init__(self, **kwargs):
         # kwargs is passed to the base class first and then read again below;
         # each field falls back to the literal default when its key is absent.
-        super().__init__(**kwargs)
-        self.vit_model_name = kwargs.get("vit_model_name", "google/vit-base-patch16-224")
-        self.hidden_size = kwargs.get("hidden_size", 768)
-        self.intermediate_size = kwargs.get("intermediate_size", 256)
-        self.final_size = kwargs.get("final_size", 64)
-        self.dropout_rate = kwargs.get("dropout_rate", 0.1)
-class AgeGenderViTModel(PreTrainedModel):
-    """Age-Gender ViT Model following HuggingFace standards"""
     # NOTE(review): pre-change version of the model as shown by the "-" markers.
-    config_class = AgeGenderConfig
-    def __init__(self, config=None):
         # A default AgeGenderConfig is created when the caller passes none.
-        if config is None:
-            config = AgeGenderConfig()
         super().__init__(config)
         # NOTE(review): the checkpoint name and the layer sizes below are
         # literals; the config fields (vit_model_name, hidden_size,
         # intermediate_size, final_size, dropout_rate) are not read here.
-        self.vit = ViTModel.from_pretrained("google/vit-base-patch16-224")
         # Age head: 768 → 256 → 64 → 1
         self.age_head = nn.Sequential(
-            nn.Linear(768, 256), nn.ReLU(), nn.Dropout(0.1),
-            nn.Linear(256, 64), nn.ReLU(), nn.Dropout(0.1),
             nn.Linear(64, 1)
         )
         # Gender head: 768 → 256 → 64 → 1
         # Ends in a Sigmoid, so this head emits a value in (0, 1).
         self.gender_head = nn.Sequential(
-            nn.Linear(768, 256), nn.ReLU(), nn.Dropout(0.1),
-            nn.Linear(256, 64), nn.ReLU(), nn.Dropout(0.1),
-            nn.Linear(64, 1), nn.Sigmoid()
         )
-        # Required for some pipeline compatibility
         # NOTE(review): forward() below never calls self.classifier.
-        self.classifier = nn.Linear(2, 2)
-    def forward(self, pixel_values, **kwargs):
         """Forward pass returning logits for pipeline"""
         # Extra kwargs are accepted but not forwarded to the backbone.
-        vit_outputs = self.vit(pixel_values=pixel_values)
-        pooled_output = vit_outputs.pooler_output
         age_output = self.age_head(pooled_output)
         gender_output = self.gender_head(pooled_output)
-        # Create concatenated logits for pipeline processing
         # Column 0 is the raw age-head output, column 1 the sigmoid gender value.
         logits = torch.cat([age_output, gender_output], dim=1)
         return {"logits": logits}
 class AgeGenderImageClassificationPipeline(ImageClassificationPipeline):
-    """
-    Custom pipeline following HuggingFace documentation standards
-    Reference: https://huggingface.co/docs/transformers/add_new_pipeline
-    """
-    def _sanitize_parameters(self, **kwargs):
-        """Sanitize parameters following HF guidelines"""
-        preprocess_kwargs = {}
-        postprocess_kwargs = {}
-        # Handle any custom parameters here if needed
-        if "top_k" in kwargs:
-            postprocess_kwargs["top_k"] = kwargs["top_k"]
-        return preprocess_kwargs, {}, postprocess_kwargs
-    def preprocess(self, inputs, **kwargs):
-        """Preprocess inputs following HF guidelines"""
-        # Handle different input types
-        if isinstance(inputs, str):
-            if inputs.startswith(('http://', 'https://')):
-                import requests
-                from io import BytesIO
-                response = requests.get(inputs)
-                inputs = Image.open(BytesIO(response.content)).convert('RGB')
-            else:
-                inputs = Image.open(inputs).convert('RGB')
-        elif isinstance(inputs, np.ndarray):
-            inputs = Image.fromarray(inputs).convert('RGB')
-        elif not isinstance(inputs, Image.Image):
-            inputs = inputs.convert('RGB')
-        # Use the model's image processor
-        return super().preprocess(inputs, **kwargs)
-    def _forward(self, model_inputs, **kwargs):
-        """Forward pass following HF guidelines"""
-        return self.model(**model_inputs)
     def postprocess(self, model_outputs, top_k=1, **kwargs):
-        """
-        Postprocess model outputs to age/gender format
-        This is where LABEL_0/LABEL_1 gets converted to real predictions
-        """
-        # Extract logits from model output
-        logits = model_outputs["logits"]
-        # Get age and gender from concatenated logits
-        age_raw = logits[0, 0].item()      # First element is age
-        gender_raw = logits[0, 1].item()   # Second element is gender
-        # Apply the scaling we discovered through testing
-        # age_raw ~0.7 maps to realistic ages using this formula:
         age = int(max(18, min(70, ((age_raw - 1.5) / 1.0) * 50 + 20)))
-        # Process gender (already sigmoid'd in the model)
         gender_prob = gender_raw
         gender = "Female" if gender_prob > 0.5 else "Male"
         confidence = gender_prob if gender_prob > 0.5 else 1 - gender_prob
-        # Return in the standard pipeline format with age/gender keys
         return [{
             "label": f"{age} years, {gender}",
             "score": confidence,
@@ -150,13 +110,13 @@ class AgeGenderImageClassificationPipeline(ImageClassificationPipeline):
         }]
-# Manual functions for advanced users
-def predict_age_gender(image_path):
-    """Manual prediction function for advanced usage"""
     import torch.nn as nn
     from transformers import ViTImageProcessor, ViTModel
-    class SimpleAgeGenderModel(nn.Module):
         def __init__(self):
             super().__init__()
             self.vit = ViTModel.from_pretrained('google/vit-base-patch16-224')
@@ -181,7 +141,7 @@ def predict_age_gender(image_path):
             return age_output, gender_output
     # Load model
-    model = SimpleAgeGenderModel()
     model_url = "https://huggingface.co/abhilash88/age-gender-prediction/resolve/main/pytorch_model.bin"
     weights = torch.hub.load_state_dict_from_url(model_url, map_location='cpu')
     filtered_weights = {k: v for k, v in weights.items() if not k.startswith('classifier.')}
@@ -204,7 +164,7 @@ def predict_age_gender(image_path):
     with torch.no_grad():
         age_raw, gender_raw = model(inputs["pixel_values"])
-    # Apply same scaling as pipeline
     age_val = age_raw.item()
     age = int(max(18, min(70, ((age_val - 1.5) / 1.0) * 50 + 20)))
@@ -220,29 +180,22 @@ def predict_age_gender(image_path):
     }
-# Test function
 if __name__ == "__main__":
     # Smoke test (pre-change version): builds the hub pipeline, runs it on one
     # image URL, then runs the manual helper on the same URL.
-    print("🧪 Testing Age-Gender Prediction Model...")
     try:
-        # Test the one-liner pipeline
         from transformers import pipeline
         # trust_remote_code=True lets the pipeline execute code shipped in the
         # model repository.
         classifier = pipeline("image-classification", model="abhilash88/age-gender-prediction", trust_remote_code=True)
-        # Test with a sample URL
         test_url = "https://images.unsplash.com/photo-1507003211169-0a1dd7228f2d?w=300"
         result = classifier(test_url)
-        print(f"✅ Pipeline result: {result[0]}")
-        print(f"✅ Age: {result[0]['age']}, Gender: {result[0]['gender']}")
-        # Test manual approach
-        manual_result = predict_age_gender(test_url)
-        print(f"✅ Manual result: {manual_result['summary']}")
-        print("🎉 TRUE ONE-LINER WORKING!")
     # Any failure is printed and not re-raised, so the script still exits
     # normally when the test fails.
     except Exception as e:
-        print(f"❌ Error: {e}")
-        print("Upload the corrected files to enable the one-liner")

 """
+Age-Gender Prediction Model - Simplified Working Version
+Uses standard ViT model_type to avoid CONFIG_MAPPING issues
+EXACT Usage:
 from transformers import pipeline
 classifier = pipeline("image-classification", model="abhilash88/age-gender-prediction", trust_remote_code=True)
 result = classifier("image.jpg")
 from transformers import (
     ViTModel,
     ViTImageProcessor,
+    ViTPreTrainedModel,
+    ViTConfig,
+    ImageClassificationPipeline
 )
 from PIL import Image
 import numpy as np
+class AgeGenderViTModel(ViTPreTrainedModel):
+    """Age-Gender ViT Model using standard ViT architecture"""
     # Two small MLP heads (age, gender) sit on top of a ViT backbone; forward()
     # returns both head outputs side by side under the key "logits".
     # NOTE(review): the first character of each line here is a diff marker
     # ("+" added, " " unchanged), not Python source.
+    def __init__(self, config):
         super().__init__(config)
         # The backbone is constructed from `config` (no from_pretrained call
         # here) and without ViT's pooling layer; forward() takes the first
         # token of the sequence output instead.
+        self.vit = ViTModel(config, add_pooling_layer=False)
         # Age head: config.hidden_size → 256 → 64 → 1, no final activation.
         self.age_head = nn.Sequential(
+            nn.Linear(config.hidden_size, 256),
+            nn.ReLU(),
+            nn.Dropout(0.1),
+            nn.Linear(256, 64),
+            nn.ReLU(),
+            nn.Dropout(0.1),
             nn.Linear(64, 1)
         )
         # Gender head: config.hidden_size → 256 → 64 → 1, followed by a
         # Sigmoid, so this head emits a value in (0, 1).
         self.gender_head = nn.Sequential(
+            nn.Linear(config.hidden_size, 256),
+            nn.ReLU(),
+            nn.Dropout(0.1),
+            nn.Linear(256, 64),
+            nn.ReLU(),
+            nn.Dropout(0.1),
+            nn.Linear(64, 1),
+            nn.Sigmoid()
         )
+        # Standard classifier for compatibility
         # NOTE(review): forward() below never calls self.classifier.
+        self.classifier = nn.Linear(config.hidden_size, 2)
+        # Initialize weights
+        self.post_init()
+    def forward(self, pixel_values=None, **kwargs):
         """Forward pass returning logits for pipeline"""
         # All extra keyword arguments are forwarded unchanged to the backbone.
+        # Get ViT outputs
+        outputs = self.vit(pixel_values=pixel_values, **kwargs)
+        # Use the last hidden state and pool it
+        sequence_output = outputs[0]
+        pooled_output = sequence_output[:, 0]  # Use [CLS] token
+        # Get age and gender predictions
         age_output = self.age_head(pooled_output)
         gender_output = self.gender_head(pooled_output)
+        # Create logits for pipeline
         # Column 0 is the raw age-head output and column 1 the sigmoid gender
         # value, so despite the key name the second column is already a
         # probability-like number, not a logit.
         logits = torch.cat([age_output, gender_output], dim=1)
         return {"logits": logits}
 class AgeGenderImageClassificationPipeline(ImageClassificationPipeline):
+    """Custom pipeline that converts model outputs to age/gender"""
     # Only postprocess() is overridden in the lines visible here.
     def postprocess(self, model_outputs, top_k=1, **kwargs):
+        """Convert logits to age/gender predictions"""
         # top_k and **kwargs are accepted but not used in the visible lines.
         # Only row 0 of the logits is read, so any further rows in a batch
         # are ignored.
+        # Extract logits
+        logits = model_outputs["logits"]
+        age_raw = logits[0, 0].item()
+        gender_raw = logits[0, 1].item()
+        # Apply scaling discovered through testing
         # Linear map 50 * (age_raw - 1.5) + 20, clamped to [18, 70] and
         # truncated to int.
         # NOTE(review): with this formula any age_raw at or below 1.46 is
         # reported as 18 and any at or above 2.5 as 70 — confirm the constants
         # against the trained model's actual output range.
         age = int(max(18, min(70, ((age_raw - 1.5) / 1.0) * 50 + 20)))
+        # Process gender
         # gender_raw is used directly as a probability; values above 0.5 map to
         # "Female", everything else (including exactly 0.5) to "Male".
         gender_prob = gender_raw
         gender = "Female" if gender_prob > 0.5 else "Male"
         # Confidence is the probability of whichever label was chosen.
         confidence = gender_prob if gender_prob > 0.5 else 1 - gender_prob
+        # Return standard pipeline format
         # NOTE(review): the __main__ block reads result[0]['age'] and
         # result[0]['gender']; those keys are not visible in this dict and are
         # presumably in lines the diff view elides before the closing bracket —
         # confirm against the full file.
         return [{
             "label": f"{age} years, {gender}",
             "score": confidence,
         }]
+# Helper function for manual usage
+def predict_age_gender_manual(image_path):
+    """Manual prediction without pipeline"""
     import torch.nn as nn
     from transformers import ViTImageProcessor, ViTModel
+    class SimpleModel(nn.Module):
         def __init__(self):
             super().__init__()
             self.vit = ViTModel.from_pretrained('google/vit-base-patch16-224')
             return age_output, gender_output
     # Load model
+    model = SimpleModel()
     model_url = "https://huggingface.co/abhilash88/age-gender-prediction/resolve/main/pytorch_model.bin"
     weights = torch.hub.load_state_dict_from_url(model_url, map_location='cpu')
     filtered_weights = {k: v for k, v in weights.items() if not k.startswith('classifier.')}
     with torch.no_grad():
         age_raw, gender_raw = model(inputs["pixel_values"])
+    # Apply scaling
     age_val = age_raw.item()
     age = int(max(18, min(70, ((age_val - 1.5) / 1.0) * 50 + 20)))
     }
 if __name__ == "__main__":
     # Smoke test: builds the hub pipeline, runs it on one image URL, then runs
     # the manual helper on the same URL.
+    print("🧪 Testing simplified Age-Gender model...")
     try:
         from transformers import pipeline
+        # Test pipeline
         # trust_remote_code=True lets the pipeline execute code shipped in the
         # model repository.
         classifier = pipeline("image-classification", model="abhilash88/age-gender-prediction", trust_remote_code=True)
         test_url = "https://images.unsplash.com/photo-1507003211169-0a1dd7228f2d?w=300"
         result = classifier(test_url)
+        print(f"✅ Pipeline: Age {result[0]['age']}, Gender {result[0]['gender']}")
+        # Test manual
         # NOTE(review): the helper is given a URL here; whether it can open
         # URLs (rather than only local paths) is not visible in this view.
+        manual_result = predict_age_gender_manual(test_url)
+        print(f"✅ Manual: {manual_result['summary']}")
     # Any failure is printed and not re-raised, so the script still exits
     # normally when the test fails.
     except Exception as e:
+        print(f"❌ Error: {e}")