image_demo.py


#%% 
# Importing necessary basic libraries and modules
import numpy as np
import os
from PIL import Image

#%% 
# PyTorch imports 
import torch
#%% 
# Importing the model, dataset, transformations and utility functions from PytorchWildlife
from PytorchWildlife.models import detection as pw_detection
from PytorchWildlife.data import transforms as pw_trans
from PytorchWildlife import utils as pw_utils


def pw_detect(im_file, new_file, threshold=None, pre_detects=None, diff_reasoning=False, verbose=False):

    if not isinstance(threshold, float):
        threshold = 0.2

    classify = False
    
    #%% 
    # Setting the device to use for computations ('cuda' indicates GPU)
    DEVICE = "cuda" if torch.cuda.is_available() else "cpu"
    if verbose:
        print(DEVICE)
        print(f"Threshold: {threshold}")
    #%% 
    # Initializing the MegaDetectorV5 model for image detection
    detection_model = pw_detection.MegaDetectorV5(device=DEVICE, pretrained=True)

    #%% Single image detection
    # Specifying the path to the target image TODO: Allow argparsing

    # Opening and converting the image to RGB format
    img = np.array(Image.open(im_file).convert("RGB"))

    # Initializing the Yolo-specific transform for the image
    transform = pw_trans.MegaDetector_v5_Transform(target_size=detection_model.IMAGE_SIZE,
                                                stride=detection_model.STRIDE)

    new_file_path = os.path.dirname(new_file)

    # Performing the detection on the single image
    result = detection_model.single_image_detection(transform(img), img.shape, im_file, conf_thres=threshold)
    
    #result['img_id'] = result['img_id'].replace("\\","/")

    if diff_reasoning and pre_detects is not None:
        # extract values of bounding boxes from the result dictionary
        bounding_boxes = result['detections'].xyxy
        prev_bounding_boxes = pre_detects.xyxy
        # if bounding boxes heardly change, then animal change into blank
        if len(bounding_boxes) == len(prev_bounding_boxes):
            for i in range(len(bounding_boxes)):
                if (abs(bounding_boxes[i][0] - prev_bounding_boxes[i][0]) < 5 and
                    abs(bounding_boxes[i][1] - prev_bounding_boxes[i][1]) < 5 and
                    abs(bounding_boxes[i][2] - prev_bounding_boxes[i][2]) < 5 and
                    abs(bounding_boxes[i][3] - prev_bounding_boxes[i][3]) < 5):
                    print(f"bounding boxes:{bounding_boxes[i]}")
                    print(f"previous bounding boxes:{prev_bounding_boxes[i]}")
                    print("bounding box not move, change to blank")
                    #transform animal in the labels to 'blank'
                    result['labels'][i] = "blank"

    # Saving the detection results 
    animal_n = sum('animal' in item for item in result['labels'])
    print(f'{im_file} has {animal_n} animals')
    result['object'] = animal_n

    try:
        img = Image.open(im_file)
        exif_data = img._getexif()
        result['eventStart']  = exif_data[36867]
        result['eventEnd'] = exif_data[36867]
        result["Make"] = exif_data[271]
    except:
        result['eventStart'] = "None"
        result['eventEnd'] = "None"
        result["Make"] = None

    if animal_n > 0:
        if verbose:
            print(f"Saving detection images to {new_file_path}")
            print(result)
        pw_utils.save_detection_images(result, new_file_path)
        if classify:
            try:
                animalclass = Classifier(model_dir=os.getcwd())
                sp, conf = animalclass.run_prediction(result, img)
                result['name'] = sp
                result['sp_confidence'] = conf
            except Exception as e:
                print(f"Error in classification: {e}")
                result['name'] = "False"
                result['sp_confidence'] = "False"
    
    return result