toothbrush_head_final_visualize.py

## checklist

## file hwakjangja..  .jpg or .png or .bmp
## test_dir name!! check test_dir in visualize.py too!


import os
os.environ["CUDA_DEVICE_ORDER"] = "PCI_BUS_ID"
os.environ['CUDA_VISIBLE_DEVICES'] = "0"

import sys
import json
import datetime
import numpy as np
import skimage.draw
import pandas as pd
import cv2
import re
import random

from keras.preprocessing.image import ImageDataGenerator
from keras.models import Sequential
from keras.layers import Dense
from keras.optimizers import Adam
import time
import tensorflow as tf
from efficientnet.keras import EfficientNetB3, EfficientNetB0
from keras.models import load_model
from sklearn.metrics import confusion_matrix
import csv

# Root directory of the project
ROOT_DIR = os.path.abspath("../")

# Import Mask RCNN
from PIL import Image

sys.path.append(ROOT_DIR)  # To find local version of the library
from mrcnn.config import Config
from mrcnn import model as modellib, utils
from mrcnn import abrush_visualize
import time

# Directory to save logs and model checkpoints, if not provided
# through the command line argument --logs
# DEFAULT_LOGS_DIR = os.path.join(ROOT_DIR, "logs")
DEFAULT_LOGS_DIR = "./logs"
DEFAULT_IMAGE_DIR = './datasets/brush'
DEFAULT_MRCNN_MODEL_DIR = './models/brush/mask_rcnn_toothbrush_head_0020.h5'
DEFAULT_EFF_MODEL_DIR = './models/brush/efficient-best_weight_220119_2.h5'

total_start = time.time()
############################################################
#  Configurations
############################################################


class ToothBrushHeadConfig(Config):
    """Configuration for training on the toy  dataset.
    Derives from the base Config class and overrides some values.
    """
    # Give the configuration a recognizable name
    NAME = "toothbrush_head"

    # We use a GPU with 12GB memory, which can fit two images.
    # Adjust down if you use a smaller GPU.
    IMAGES_PER_GPU = 2

    # Number of classes (including background)
    NUM_CLASSES = 1 + 1  # Background + balloon

    # Number of training steps per epoch
    STEPS_PER_EPOCH = 100

    # Skip detections with < 90% confidence
    DETECTION_MIN_CONFIDENCE = 0.9


############################################################
#  Dataset
############################################################

def color_splash(image, mask):
    """Apply color splash effect.
    image: RGB image [height, width, 3]
    mask: instance segmentation mask [height, width, instance count]

    Returns result image.
    """
    # Make a grayscale copy of the image. The grayscale copy still
    # has 3 RGB channels, though.
    gray = skimage.color.gray2rgb(skimage.color.rgb2gray(image)) * 255
    # Copy color pixels from the original color image where mask is set
    if mask.shape[-1] > 0:
        # We're treating all instances as one, so collapse the mask into one layer
        mask = (np.sum(mask, -1, keepdims=True) >= 1)
        splash = np.where(mask, image, gray).astype(np.uint8)
    else:
        splash = gray.astype(np.uint8)
    return splash

detect_time = []
def detect_and_color_splash(model, image_path=None, img_file_name=None):
    assert image_path

    print("Running on {}".format(image_path))
    # Read image
    image = skimage.io.imread(image_path)

    # Detect objects
    # Run model detection and generate the color splash effect
    start_inference = time.time()
    r = model.detect([image], verbose=1)[0]

    ## check time for inference
    end_inference = time.time()
    dd_time = end_inference - start_inference
    dd_time = np.floor(dd_time*10) / 10
    if "dummy" not in img_file_name:
        print("inference_time :", dd_time," sec for", img_file_name)
        detect_time.append(dd_time)

    # bounding box visualize
    class_names = ['background', 'defect']
    bbox = utils.extract_bboxes(r['masks'])
    file_name_bb = "bb_splash_{}".format(img_file_name)
    save_path_bb = os.path.join(DEFAULT_IMAGE_DIR, 'result', file_name_bb)

    # print("image_path", image_path)

    bv = abrush_visualize.display_instances(save_path_bb, image_path, image, bbox, r['masks'], r['class_ids'], class_names, r['scores'])
    #brush_visualize.display_instances(save_path_bb, image_path, image, bbox, r['masks'], r['class_ids'], class_names, r['scores'])

    # print("points : ", bv) 
    ############## show input iamge #############
    #display_img = cv2.imread(image_path, 3) 
    #display_img = cv2.resize(display_img, (int(display_img.shape[1]*0.4), int(display_img.shape[0]*0.4)))

    # cv2.imshow("input image", display_img)

    ##########################################################
    
    splash = color_splash(image, r['masks'])
    # Save output
    file_name = "splash_{}".format(img_file_name)
    save_path = os.path.join(DEFAULT_IMAGE_DIR , 'result', file_name)
    skimage.io.imsave(save_path, splash)
    
    #display_splash = splash.copy()
    #display_splash = cv2.resize(display_splash, (int(display_splash.shape[1]*0.4), int(display_splash.shape[0]*0.4)))
    #cv2.imshow("splash", display_splash)
    #cv2.waitKey(3)
    
    print("Saved to ", save_path)
    return bv

#result =[]
############################################################
#  sort filenames by human order
############################################################

def atoi(text):
    return int(text) if text.isdigit() else text

def natural_keys(text):
    return [ atoi(c) for c in re.split(r'(\d+)', text) ]


############################################################
#  classification
############################################################

class_time = []

def binary_classification(imgname, model, points):
    test_dir = os.path.join(DEFAULT_IMAGE_DIR+'/cropped/'+imgname)
    cnt_cropped = os.path.join(test_dir+'/test')
    cropped = len(os.listdir(cnt_cropped))

    path = "/home/yjkim/NOAH/gongin/datasets/brush/result/"
    res_path = os.path.join(path+'bb_splash_'+imgname+'.png')
    
    or_path = "/home/yjkim/NOAH/gongin/datasets/brush/test/"
    ori_path = os.path.join(or_path + imgname+'.bmp')
        
    res_img = cv2.imread(ori_path, 3)
    input_img = res_img.copy()
    bb_img = cv2.imread(res_path, 3)      
        
  
    if cropped == 25 or cropped == 34:
        test_datagen = ImageDataGenerator(
            rescale=1 / 255
        )

        test_generator = test_datagen.flow_from_directory(
            test_dir,
            target_size=(32, 32),
            batch_size=1,
            shuffle=False,
            class_mode=None
        )
        
        #print("check filenames : ", test_generator.filenames)
        start_classification = time.time()
        preds = model.predict_generator(test_generator, steps=len(test_generator.filenames))

        end_classification = time.time()

        ## check time
        inference_time = end_classification - start_classification
        inference_time = np.floor(inference_time *10) /10
        if "dummy" not in imgname:
            print(inference_time," sec for inferencing toothbrush hair")
            class_time.append(inference_time)

        
        test_generator.filenames.sort(key=natural_keys)
        # print("after sort : ", test_generator.filenames)
        # print(preds)
        image_ids = [name.split('/')[-1] for name in test_generator.filenames]
        predictions = preds.flatten()

        error = []
        cnt = []
        for i in range(len(test_generator.filenames)):
            if predictions[i] > 0.5:
                error.append('error')
                cnt.append(i)
            else:
                error.append('normal')

        data = {'filename': image_ids, 'true_label': test_generator.classes, 'category': error}

        submission = pd.DataFrame(data)
        
        for i in cnt:
            x1,x2,y1,y2 = points[i]
            print(f"(x1, y1) = ({x1}, {y1}), (x2, y2) = ({x2}, {y2})")
            cv2.rectangle(res_img, (x1,y1), (x2,y2), (0,0,255), 2)
            
       # text and bbox on result image 
        
        res_img = cv2.resize(res_img, (int(res_img.shape[1]*0.5), int(res_img.shape[0]*0.5)))
        bb_img = cv2.resize(bb_img, (int(bb_img.shape[1]*0.5), int(bb_img.shape[0]*0.5)))
        input_img = cv2.resize(input_img, (int(input_img.shape[1]*0.5), int(input_img.shape[0]*0.5)))
        res_img = cv2.putText(res_img, f"{len(cnt)} error brush detected", (200,100), cv2.FONT_HERSHEY_PLAIN, 3, (0,0,255), 2)
        
        cv2.imwrite(f"/home/yjkim/NOAH/gongin/datasets/brush/result/bbox_{imgname}.png", res_img)
        cv2.imwrite(f"/home/yjkim/NOAH/gongin/datasets/brush/result/bb_text_{imgname}.png", bb_img)
        
        print(f"brush number {cnt} is error") 
        
        cv2.imshow("input image", input_img)
        cv2.imshow("detected image", bb_img)
        cv2.imshow("result image", res_img)
            
        while(True):
            if cv2.waitKey(1)&0xFF == ord('x'):
                cv2.destroyAllWindows()
                break
        
        # final classification! whether error or not
        if (submission['category'] == 'error').any():
            print(imgname,"is error tooth brush")
            return 0

        else:
            return 1
        

    else:
        inference_time = 0
        class_time.append(inference_time)
        print(round(inference_time,2), " sec for inferencing toothbrush hair")

        # text on result image 
        # 식모 갯수보다 더 잡았을때 => 식모가 너무 불규칙해서 에러로 잡는 경우
        res_img = cv2.putText(res_img, f"more brush detected", (200,100), cv2.FONT_HERSHEY_PLAIN, 3, (0,0,255), 2)
        res_img = cv2.resize(res_img, (int(res_img.shape[1]*0.5), int(res_img.shape[0]*0.5)))
        input_img = cv2.resize(input_img, (int(input_img.shape[1]*0.5), int(input_img.shape[0]*0.5)))
        
        cv2.imshow("input image", input_img)
        cv2.imshow("result image", res_img)
        while (True):
            if cv2.waitKey(1) & 0xFF == ord('x'):
                cv2.destroyAllWindows()
                break
        
        #cv2.waitKey(3)
        
        
        return 0
############################################################
#  main
############################################################

if __name__ == '__main__':

    class InferenceConfig(ToothBrushHeadConfig):
        # Set batch size to 1 since we'll be running inference on
        # one image at a time. Batch size = GPU_COUNT * IMAGES_PER_GPU
        GPU_COUNT = 1
        IMAGES_PER_GPU = 1


    config = InferenceConfig()

    config.display()
    #####

    result_path = DEFAULT_IMAGE_DIR+'/result'
    cropped_path = DEFAULT_IMAGE_DIR+'/cropped'

    if not os.path.isdir(result_path):
        os.mkdir(DEFAULT_IMAGE_DIR+'/result')
        os.mkdir(DEFAULT_IMAGE_DIR+'/cropped')


################# LOAD MODELS #######################
    #### MASK-R-CNN
    mrcnn_model = modellib.MaskRCNN(mode="inference", config=config,
                                  model_dir=DEFAULT_LOGS_DIR)
    weights_path = DEFAULT_MRCNN_MODEL_DIR
    mrcnn_model.load_weights(weights_path, by_name=True)

    ##### EFFICIENTNET

    efficient_net = EfficientNetB0(
        weights='imagenet',
        input_shape=(32, 32, 3),
        include_top=False,
        pooling='max'
    )

    eff_model = Sequential()
    eff_model.add(efficient_net)
    eff_model.add(Dense(units=120, activation='relu'))
    eff_model.add(Dense(units=120, activation='relu'))
    eff_model.add(Dense(units=1, activation='sigmoid'))
    eff_model.summary()

    eff_model.compile(optimizer=Adam(lr=0.0001), loss='binary_crossentropy', metrics=['accuracy'])

    eff_model.load_weights(DEFAULT_EFF_MODEL_DIR)
    #############################################################################3

    # each image in folder
    image_path = DEFAULT_IMAGE_DIR
    image_dir = os.path.join(image_path + "/test")
    dirs = os.listdir(image_dir)

    images = [file for file in dirs if file.endswith('.png') or file.endswith('.jpg') or file.endswith('.bmp')]
    #images.sort()
    random.shuffle(images)
    random.shuffle(images)
    
    # print("len iamges :::: ", len(images))
    result = []
    submission = {}
    err_toothbrush_total = []
    each_toothbrush_info_total =[]
    ## arrange results and make csv file
    for img in images:
        imgname = os.path.join(image_dir, img)
        onlyname, _ = os.path.splitext(img)
        imgname_png = onlyname + '.png'
        # output_imgname = os.path.join(image_path, imgname_png)
    
        bv = detect_and_color_splash(mrcnn_model, image_path=imgname, img_file_name=imgname_png)
        #detect_and_color_splash(mrcnn_model, image_path=imgname, img_file_name=imgname_png)
        
        result = binary_classification(onlyname, eff_model, bv)
        submission[onlyname] = result
        #print("submission : ", submission)

    TN = 0
    TP = 0
    normal_file = 0
    error_file = 0
    total_test_img = len(submission) - 2

    for i in submission:
        if "Frame" in i and "dummy" not in i:
            normal_file += 1
        if "Frame" not in i and "dummy" not in i:
            error_file += 1
        if "dummy" in i:
            continue
        if "Frame" not in i and submission[i] == 0:
            TN += 1
        elif "Frame" in i and submission[i] == 1:
            TP +=  1   ### compute time
            
        
    total_end = time.time()
    print("total time : ", total_end- total_start)
    detect_avg = np.floor((sum(detect_time, 0.0) / len(detect_time)) * 10) /10
    classi_avg = np.floor((sum(class_time, 0.0) / len(class_time)) * 10) / 10
    acc = (TN + TP) / total_test_img
    print("length of detect_time : ", len(detect_time))
    print("length of class_time : ", len(class_time))
    total_avg = detect_avg + classi_avg
    print("total_test_img", total_test_img)
    print("normal_file : ", normal_file)
    print("err_file : ", error_file)
    print("Average classification time : ", classi_avg)
    print("Average detection time : ", detect_avg)
    print("==========================================================")
    print("True Positive", TP)
    print("True Negative", TN)
    # print(f"(TP + TN) / 전체이미지 : ({TP} + {TN}) / {len(images)}")
    print("Accuracy : ", round(acc, 2)*100, "%")
    print("Average Time per Image : ", total_avg, "s")