Spaces:

HMWCS
/

Gemma3n-challenge-demo

Running on Zero

App Files Files Community

HMWCS commited on Aug 1

Commit

b770303

verified ·

1 Parent(s): dc8106e

feat: delete images

Browse files

Files changed (9) hide show

test_images/cardboard1.jpg +0 -0
test_images/classifier.py +0 -475
test_images/electronic_ewaste.jpg +0 -0
test_images/glass2.jpg +0 -0
test_images/knowledge_base.py +0 -87
test_images/metal5.jpg +0 -0
test_images/mixed-waste-mix.jpg +0 -3
test_images/open-box-pizzaweb.jpg +0 -3
test_images/toliet-paper.jpeg +0 -0

test_images/cardboard1.jpg DELETED Viewed

Binary file (17.3 kB)

test_images/classifier.py DELETED Viewed

@@ -1,475 +0,0 @@
-from transformers import AutoProcessor, AutoModelForImageTextToText
-from PIL import Image
-import torch
-import logging
-from typing import Union, Tuple
-from config import Config
-from knowledge_base import GarbageClassificationKnowledge
-import re
-def preprocess_image(image: Image.Image) -> Image.Image:
-    """
-    Preprocess image to meet Gemma3n requirements (512x512)
-    """
-    # Convert to RGB if necessary
-    if image.mode != "RGB":
-        image = image.convert("RGB")
-    # Resize to 512x512 as required by Gemma3n
-    target_size = (512, 512)
-    # Calculate aspect ratio preserving resize
-    original_width, original_height = image.size
-    aspect_ratio = original_width / original_height
-    if aspect_ratio > 1:
-        # Width is larger
-        new_width = target_size[0]
-        new_height = int(target_size[0] / aspect_ratio)
-    else:
-        # Height is larger or equal
-        new_height = target_size[1]
-        new_width = int(target_size[1] * aspect_ratio)
-    # Resize image maintaining aspect ratio
-    image = image.resize((new_width, new_height), Image.Resampling.LANCZOS)
-    # Create a new image with target size and paste the resized image
-    processed_image = Image.new(
-        "RGB", target_size, (255, 255, 255)
-    )  # White background
-    # Calculate position to center the image
-    x_offset = (target_size[0] - new_width) // 2
-    y_offset = (target_size[1] - new_height) // 2
-    processed_image.paste(image, (x_offset, y_offset))
-    return processed_image
-class GarbageClassifier:
-    def __init__(self, config: Config = None):
-        self.config = config or Config()
-        self.knowledge = GarbageClassificationKnowledge()
-        self.processor = None
-        self.model = None
-        # self.device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
-        # Setup logging
-        logging.basicConfig(level=logging.INFO)
-        self.logger = logging.getLogger(__name__)
-    def load_model(self):
-        """Load the model and processor"""
-        try:
-            self.logger.info(f"Loading model: {self.config.MODEL_NAME}")
-            # Load processor
-            kwargs = {}
-            if self.config.HF_TOKEN:
-                kwargs["token"] = self.config.HF_TOKEN
-            self.processor = AutoProcessor.from_pretrained(
-                self.config.MODEL_NAME, **kwargs
-            )
-            # Load model
-            self.model = AutoModelForImageTextToText.from_pretrained(
-                self.config.MODEL_NAME,
-                torch_dtype=self.config.TORCH_DTYPE,
-                device_map=self.config.DEVICE_MAP,
-            )
-            self.logger.info("Model loaded successfully")
-        except Exception as e:
-            self.logger.error(f"Error loading model: {str(e)}")
-            raise
-    def classify_image(self, image: Union[str, Image.Image]) -> Tuple[str, str, int]:
-        """
-        Classify garbage in the image
-        Args:
-            image: PIL Image or path to image file
-        Returns:
-            Tuple of (classification_result, detailed_analysis, confidence_score)
-        """
-        if self.model is None or self.processor is None:
-            raise RuntimeError("Model not loaded. Call load_model() first.")
-        try:
-            # Load and process image
-            if isinstance(image, str):
-                image = Image.open(image)
-            elif not isinstance(image, Image.Image):
-                raise ValueError("Image must be a PIL Image or file path")
-            # Preprocess image to meet Gemma3n requirements
-            processed_image = preprocess_image(image)
-            # Prepare messages with system prompt and user query
-            messages = [
-                {
-                    "role": "system",
-                    "content": [
-                        {
-                            "type": "text",
-                            "text": self.knowledge.get_system_prompt(),
-                        }
-                    ],
-                },
-                {
-                    "role": "user",
-                    "content": [
-                        {"type": "image", "image": processed_image},
-                        {
-                            "type": "text",
-                            "text": "Please classify what you see in this image. If it shows garbage/waste items, classify them according to the garbage classification standards. If it shows people, living things, or other non-waste items, classify it as 'Unable to classify' and explain why it's not garbage. Also provide a confidence score from 1-10 indicating how certain you are about your classification.",
-                        },
-                    ],
-                },
-            ]
-            # Apply chat template and tokenize
-            inputs = self.processor.apply_chat_template(
-                messages,
-                add_generation_prompt=True,
-                tokenize=True,
-                return_dict=True,
-                return_tensors="pt",
-            ).to(self.model.device, dtype=self.model.dtype)
-            input_len = inputs["input_ids"].shape[-1]
-            outputs = self.model.generate(
-                **inputs,
-                max_new_tokens=self.config.MAX_NEW_TOKENS,
-                disable_compile=True,
-            )
-            response = self.processor.batch_decode(
-                outputs[:, input_len:],
-                skip_special_tokens=True,
-            )[0]
-            # Extract classification from response
-            classification = self._extract_classification(response)
-            # Extract reasoning from response
-            reasoning = self._extract_reasoning(response)
-            # Extract confidence score from response
-            confidence_score = self._extract_confidence_score(response, classification)
-            return classification, reasoning, confidence_score
-        except Exception as e:
-            self.logger.error(f"Error during classification: {str(e)}")
-            import traceback
-            traceback.print_exc()
-            return "Error", f"Classification failed: {str(e)}", 0
-    def _calculate_confidence_heuristic(self, response_lower: str, classification: str) -> int:
-        """Calculate confidence based on response content and classification type"""
-        base_confidence = 5
-        # Confidence indicators (increase confidence)
-        high_confidence_words = ["clearly", "obviously", "definitely", "certainly", "exactly"]
-        medium_confidence_words = ["appears", "seems", "likely", "probably"]
-        # Uncertainty indicators (decrease confidence)
-        uncertainty_words = ["might", "could", "possibly", "maybe", "unclear", "difficult"]
-        # Adjust based on confidence words
-        for word in high_confidence_words:
-            if word in response_lower:
-                base_confidence += 2
-                break
-        for word in medium_confidence_words:
-            if word in response_lower:
-                base_confidence += 1
-                break
-        for word in uncertainty_words:
-            if word in response_lower:
-                base_confidence -= 2
-                break
-        # Classification-specific adjustments
-        if classification == "Unable to classify":
-            if any(indicator in response_lower for indicator in ["person", "people", "human", "living"]):
-                base_confidence += 1  # High confidence when clearly not waste
-            else:
-                base_confidence -= 1  # Lower confidence for unclear items
-        elif classification == "Error":
-            base_confidence = 1
-        else:
-            # Check for specific material mentions (increases confidence)
-            specific_materials = ["aluminum", "plastic", "glass", "metal", "cardboard", "paper"]
-            if any(material in response_lower for material in specific_materials):
-                base_confidence += 1
-        return min(max(base_confidence, 1), 10)
-    def _extract_confidence_score(self, response: str, classification: str) -> int:
-        """Extract confidence score from response or calculate based on classification"""
-        response_lower = response.lower()
-        # Look for explicit confidence scores in the response
-        confidence_patterns = [
-            r'confidence[:\s]*(\d+)',
-            r'confident[:\s]*(\d+)',
-            r'certainty[:\s]*(\d+)',
-            r'score[:\s]*(\d+)',
-            r'(\d+)/10',
-            r'(\d+)\s*out\s*of\s*10'
-        ]
-        for pattern in confidence_patterns:
-            match = re.search(pattern, response_lower)
-            if match:
-                score = int(match.group(1))
-                return min(max(score, 1), 10)  # Clamp between 1-10
-        # If no explicit score found, calculate based on classification indicators
-        return self._calculate_confidence_heuristic(response_lower, classification)
-    def _extract_classification(self, response: str) -> str:
-        """Extract the main classification from the response with STRICT mixed garbage enforcement"""
-        response_lower = response.lower()
-        # STRICT MIXED GARBAGE ENFORCEMENT - Catch ANY mixed scenario
-        # 1. Explicit mixed garbage phrases
-        explicit_mixed_phrases = [
-            "multiple garbage types",
-            "multiple different",
-            "different types of garbage",
-            "various items",
-            "mixed items",
-            "several different",
-            "collection of mixed items",
-            "mixture of items",
-            "variety of items",
-            "separate items",
-            "please separate"
-        ]
-        if any(phrase in response_lower for phrase in explicit_mixed_phrases):
-            return "Unable to classify"
-        # 2. Language patterns that indicate multiple items/uncertainty about classification
-        uncertainty_patterns = [
-            "appears to be containers",
-            "what appears to be",
-            "including what appears",
-            "various colors and textures",
-            "don't clearly fall into a single",
-            "without further detail",
-            "not possible to definitively classify",
-            "more information",
-            "can't determine",
-            "difficult to identify",
-            "unclear category",
-            "mixed materials"
-        ]
-        if any(pattern in response_lower for pattern in uncertainty_patterns):
-            return "Unable to classify"
-        # 3. Multiple container/item indicators
-        multiple_item_indicators = [
-            "containers (", "bottles, cans", "bags, and", "items, including",
-            "bottles and", "cans and", "containers and", "bags and",
-            "plastic bottles, cans", "various containers"
-        ]
-        if any(indicator in response_lower for indicator in multiple_item_indicators):
-            return "Unable to classify"
-        # 4. Count different item types mentioned
-        item_types = [
-            "bottle", "can", "container", "bag", "box", "wrapper",
-            "jar", "cup", "plate", "bowl", "package"
-        ]
-        item_count = sum(1 for item_type in item_types if item_type in response_lower)
-        if item_count >= 3:  # If 3+ different container types mentioned, it's mixed
-            return "Unable to classify"
-        # ONLY EXCEPTION: Single recyclable container with visible food content
-        recyclable_container_indicators = ["container", "bottle", "can", "jar", "box", "wrapper"]
-        food_content_indicators = [
-            "food residue", "food content", "food inside", "visible food",
-            "remains", "leftovers", "scraps inside", "not empty", "not rinsed"
-        ]
-        recyclable_material_indicators = ["plastic", "aluminum", "glass", "metal", "cardboard"]
-        # Check for recycling tip warning
-        has_recycling_tip = any(tip in response_lower for tip in [
-            "tip: empty and rinse",
-            "empty and rinse this container",
-            "clean first", "rinse first"
-        ])
-        # ONLY allow Food/Kitchen classification for single contaminated container
-        has_single_container = any(indicator in response_lower for indicator in recyclable_container_indicators)
-        has_food_content = any(indicator in response_lower for indicator in food_content_indicators)
-        has_recyclable_material = any(indicator in response_lower for indicator in recyclable_material_indicators)
-        # Must be single item (not multiple) and contaminated
-        if (has_single_container and has_food_content and
-                (has_recyclable_material or has_recycling_tip) and
-                item_count <= 1):  # Only single container
-            return "Food/Kitchen Waste"
-        # Now proceed with normal classification for single, clear items
-        categories = self.knowledge.get_categories()
-        waste_categories = [cat for cat in categories if cat != "Unable to classify"]
-        for category in waste_categories:
-            if category.lower() in response_lower:
-                category_index = response_lower.find(category.lower())
-                context_before = response_lower[max(0, category_index - 30):category_index]
-                if not any(neg in context_before[-10:] for neg in ["not", "cannot", "isn't", "doesn't"]):
-                    return category
-        # Single item material detection
-        recyclable_indicators = ["recyclable", "recycle", "aluminum", "plastic", "glass", "metal", "foil", "cardboard",
-                                 "paper"]
-        if any(indicator in response_lower for indicator in recyclable_indicators):
-            if not any(cont in response_lower for cont in food_content_indicators):
-                return "Recyclable Waste"
-        # Food waste indicators
-        food_indicators = ["food", "fruit", "vegetable", "organic", "kitchen waste", "peel", "core", "scraps"]
-        if any(indicator in response_lower for indicator in food_indicators):
-            return "Food/Kitchen Waste"
-        # Hazardous waste indicators
-        hazardous_indicators = ["battery", "chemical", "medicine", "paint", "toxic", "hazardous"]
-        if any(indicator in response_lower for indicator in hazardous_indicators):
-            return "Hazardous Waste"
-        # Other waste indicators
-        other_waste_indicators = ["cigarette", "ceramic", "dust", "diaper", "tissue"]
-        if any(indicator in response_lower for indicator in other_waste_indicators):
-            return "Other Waste"
-        # Non-garbage detection
-        unable_phrases = ["unable to classify", "cannot classify", "not garbage", "not waste"]
-        if any(phrase in response_lower for phrase in unable_phrases):
-            return "Unable to classify"
-        non_garbage_indicators = ["person", "people", "human", "face", "living", "animal", "pet"]
-        if any(indicator in response_lower for indicator in non_garbage_indicators):
-            return "Unable to classify"
-        # Default fallback
-        return "Unable to classify"
-    def _extract_reasoning(self, response: str) -> str:
-        """Extract only the reasoning content, removing all formatting markers and classification info"""
-        import re
-        # Remove all formatting markers
-        cleaned_response = response.replace("**Classification**:", "")
-        cleaned_response = cleaned_response.replace("**Reasoning**:", "")
-        cleaned_response = re.sub(r'\*\*.*?\*\*:', '', cleaned_response)  # Remove any **text**: patterns
-        cleaned_response = cleaned_response.replace("**", "")  # Remove remaining ** markers
-        # Remove category names that might appear at the beginning
-        categories = self.knowledge.get_categories()
-        for category in categories:
-            if cleaned_response.strip().startswith(category):
-                cleaned_response = cleaned_response.replace(category, "", 1)
-                break
-        # Remove common material names that might appear at the beginning
-        material_names = [
-            "Glass", "Plastic", "Metal", "Paper", "Cardboard", "Aluminum",
-            "Steel", "Iron", "Tin", "Foil", "Wood", "Ceramic", "Fabric",
-            "Recyclable Waste", "Food/Kitchen Waste", "Hazardous Waste", "Other Waste"
-        ]
-        # Clean the response
-        cleaned_response = cleaned_response.strip()
-        # Remove material names at the beginning
-        for material in material_names:
-            if cleaned_response.startswith(material):
-                # Remove the material name and any following punctuation/whitespace
-                cleaned_response = cleaned_response[len(material):].lstrip(" .,;:")
-                break
-        # Split into sentences and clean up
-        sentences = []
-        # Split by common sentence endings, but keep the endings
-        parts = re.split(r'([.!?])\s+', cleaned_response)
-        # Rejoin parts to maintain sentence structure
-        reconstructed_parts = []
-        for i in range(0, len(parts), 2):
-            if i < len(parts):
-                sentence = parts[i]
-                if i + 1 < len(parts):
-                    sentence += parts[i + 1]  # Add the punctuation back
-                reconstructed_parts.append(sentence)
-        for part in reconstructed_parts:
-            part = part.strip()
-            if not part:
-                continue
-            # Skip parts that are just category names or material names
-            if part in categories or part.rstrip(".,;:") in material_names:
-                continue
-            # Skip parts that start with category names or material names
-            is_category_line = False
-            for item in categories + material_names:
-                if part.startswith(item):
-                    is_category_line = True
-                    break
-            if is_category_line:
-                continue
-            # Clean up the sentence
-            part = re.sub(r'^[A-Za-z\s]+:', '', part).strip()  # Remove "Category:" type prefixes
-            if part and len(part) > 3:  # Only keep meaningful content
-                sentences.append(part)
-        # Join sentences
-        reasoning = ' '.join(sentences)
-        # Final cleanup - remove any remaining standalone material words at the beginning
-        reasoning_words = reasoning.split()
-        if reasoning_words and reasoning_words[0] in [m.lower() for m in material_names]:
-            reasoning_words = reasoning_words[1:]
-            reasoning = ' '.join(reasoning_words)
-        # Ensure proper capitalization
-        if reasoning:
-            reasoning = reasoning[0].upper() + reasoning[1:] if len(reasoning) > 1 else reasoning.upper()
-            # Ensure proper punctuation
-            if not reasoning.endswith(('.', '!', '?')):
-                reasoning += '.'
-        return reasoning if reasoning else "Analysis not available"
-    def get_categories_info(self):
-        """Get information about all categories"""
-        return self.knowledge.get_category_descriptions()

test_images/electronic_ewaste.jpg DELETED Viewed

Binary file (24.3 kB)

test_images/glass2.jpg DELETED Viewed

Binary file (11 kB)

test_images/knowledge_base.py DELETED Viewed

@@ -1,87 +0,0 @@
-class GarbageClassificationKnowledge:
-    @staticmethod
-    def get_system_prompt():
-        return """You are a professional garbage classification expert. You need to carefully observe the items in the picture, analyze their materials, properties and uses, and then make accurate judgments according to garbage classification standards.
-IMPORTANT: You should ONLY classify items that are actually garbage/waste. If the image contains people, living things, furniture, electronics in use, or other non-waste items, you should classify it as "Unable to classify" and explain that it's not garbage.
-**MIXED GARBAGE HANDLING RULES:**
-1. **Containers with Food Content**: For any recyclable container (aluminum cans, glass jars, clean plastic bottles, etc.) that contains visible food residue or content:
-   - Classify as "Food/Kitchen Waste" due to contamination risk
-   - Always include this warning: "⚠️ Tip: Empty and rinse this container first, then it can be recycled!"
-   - Only completely empty and rinsed containers qualify as "Recyclable Waste"
-   - Non-recyclable containers (styrofoam, wax-coated) with food: classify as "Food/Kitchen Waste" with warning: "⚠️ Tip: Remove food waste for composting, then dispose container in general trash"
-2. **Multiple Different Garbage Types**: If the image shows multiple different types of garbage mixed together (e.g., electronics with food, batteries with organic waste):
-   - Classify as "Unable to classify"
-   - Include warning: "⚠️ Warning: Multiple garbage types detected. Please separate items for proper classification."
-Garbage classification standards:
-**Recyclable Waste**:
-- Paper: newspapers, magazines, books, various packaging papers, office paper, advertising flyers, clean cardboard boxes, copy paper, etc.
-- Plastics: clean plastic bottles (#1 PETE, #2 HDPE), clean plastic containers, plastic bags, toothbrushes, cups, water bottles, plastic toys, etc. (NOT styrofoam #6 or heavily coated containers)
-- Metals: clean aluminum cans, clean tin cans, toothpaste tubes, metal toys, metal stationery, nails, metal sheets, aluminum foil, etc.
-- Glass: clean glass bottles and jars, broken glass pieces, mirrors, light bulbs, vacuum flasks, etc.
-- Textiles: old clothing, textile products, shoes, curtains, towels, bags, etc.
-- NOTE: Only clean, empty containers qualify. Contaminated containers go to Food/Kitchen Waste. Wax-coated containers, styrofoam, and multi-material packaging are NOT recyclable.
-**Food/Kitchen Waste**:
-- Food scraps: rice, noodles, bread, meat, fish, shrimp shells, crab shells, bones, etc.
-- Fruit peels and cores: watermelon rinds, apple cores, orange peels, banana peels, nut shells, etc.
-- Plants: withered branches and leaves, flowers, traditional Chinese medicine residue, etc.
-- Expired food: expired canned food, cookies, candy, etc.
-- Contaminated containers: any container with visible food residue or content
-**Hazardous Waste**:
-- Batteries: dry batteries, rechargeable batteries, button batteries, and all types of batteries
-- Light tubes: energy-saving lamps, fluorescent tubes, incandescent bulbs, LED lights, etc.
-- Pharmaceuticals: expired medicines, medicine packaging, thermometers, blood pressure monitors, etc.
-- Paints: paint, coatings, glue, nail polish, cosmetics, etc.
-- Others: pesticides, cleaning agents, agricultural chemicals, X-ray films, etc.
-**Other Waste**:
-- Contaminated non-recyclable paper: toilet paper, diapers, wet wipes, napkins, etc.
-- Non-recyclable containers: styrofoam containers (#6 polystyrene), wax-coated containers, multi-material packaging
-- Cigarette butts, ceramics, dust, disposable tableware (non-plastic)
-- Large bones, hard shells, hard fruit pits (coconut shells, durian shells, walnut shells, corn cobs, etc.)
-- Hair, pet waste, cat litter, etc.
-**Unable to classify**:
-- People, human faces, human body parts
-- Living animals, pets
-- Furniture, appliances, electronics in normal use
-- Buildings, landscapes, vehicles
-- Any item that is not intended to be discarded as waste
-- Multiple different garbage types mixed together
-Please observe the items in the image carefully according to the above classification standards. If the image shows garbage/waste items, provide accurate garbage classification results. If the image does NOT show garbage/waste (e.g., people, living things, functioning items), classify it as "Unable to classify" and explain why it's not garbage.
-For mixed garbage situations, apply the special handling rules above and include appropriate warnings.
-Format your response EXACTLY as follows:
-**Classification**: [Category Name or "Unable to classify"]
-**Reasoning**: [Brief explanation of why this item belongs to this category, or why it cannot be classified as garbage]
-**Confidence Score**: [Number from 1-10]"""
-    @staticmethod
-    def get_categories():
-        return [
-            "Recyclable Waste",
-            "Food/Kitchen Waste",
-            "Hazardous Waste",
-            "Other Waste",
-            "Unable to classify",
-        ]
-    @staticmethod
-    def get_category_descriptions():
-        return {
-            "Recyclable Waste": "Items that can be processed and reused, including paper, plastic, metal, glass, and textiles (must be clean and empty)",
-            "Food/Kitchen Waste": "Organic waste from food preparation and consumption, including contaminated containers",
-            "Hazardous Waste": "Items containing harmful substances that require special disposal",
-            "Other Waste": "Items that don't fit into other categories and go to general waste",
-            "Unable to classify": "Items that are not garbage/waste, such as people, living things, functioning objects, or mixed garbage types",
-        }

test_images/metal5.jpg DELETED Viewed

Binary file (22.3 kB)

test_images/mixed-waste-mix.jpg DELETED Viewed

Git LFS Details

SHA256: 75b5d948bea8c8ff4753b7a9e51d2c5087f49bed2194c6dcfbdf3358322f77fd
Pointer size: 131 Bytes
Size of remote file: 151 kB

test_images/open-box-pizzaweb.jpg DELETED Viewed

Git LFS Details

SHA256: 53f57a45a193aea7c042a9a6cb07af7f6de1176ad02f9ef6ef0da58d09b2713b
Pointer size: 131 Bytes
Size of remote file: 111 kB

test_images/toliet-paper.jpeg DELETED Viewed

Binary file (3.07 kB)