core/image_handler.py

import cv2
import numpy as np


class ImagePack:
    def __init__(self, path, img_size=640, stride=32, byteMode=False, gray=False):
        if byteMode:  # 이미지 바이트 상태로 들어온 경우
            img = np.array(path)
            img = img[:, :, ::-1].copy()
            self.o_img = img
        else:

            # gif 면 첫 프레임만 따옴
            if str(path).lower().endswith('.gif'):
                gif = cv2.VideoCapture(path)
                ret, frame = gif.read()
                if ret:
                    self.o_img = frame
            else:
                # 윈도우 이미지 로드용
                win_load = np.fromfile(path, np.uint8)
                win_img = cv2.imdecode(win_load, cv2.IMREAD_COLOR)
                self.o_img = win_img

        if gray:
            # self.o_img[:, :, 0] = 0.299
            # self.o_img[:, :, 1] = 0.587
            # self.o_img[:, :, 2] = 0.114
            # cv2.imwrite('test.jpg', self.o_img)
            # np.dot(rgb[..., :3], [0.299, 0.587, 0.114])
            self.o_img = cv2.cvtColor(self.o_img, cv2.COLOR_BGR2GRAY)
            self.o_img = cv2.cvtColor(self.o_img, cv2.COLOR_GRAY2BGR)
            cv2.imwrite('test.jpg', self.o_img)

        # self.o_img = cv2.imread(path)  # 원본
        assert self.o_img is not None, '이미지를 찾을 수 없습니다 ' + path

        if self.o_img.shape[1] < 1280:
            self.o_img = self.resize_test_test(self.o_img, 1280)

        self.n_img = self.o_img  # 현재 이미지

        self.img_size = img_size
        self.stride = stride
        self.t_img = self.img2pyt(self.n_img)  # 검출용 이미지

    def img2pyt(self, imgO):
        img = letterbox(imgO, self.img_size, stride=self.stride)[0]
        img = img[:, :, ::-1].transpose(2, 0, 1)
        img = np.ascontiguousarray(img)
        return img

    def reset(self, img_size, stride):
        self.img_size = img_size
        self.stride = stride
        self.t_img = self.img2pyt(self.n_img)

    def crop(self, rect, im0s):
        x1, y1, x2, y2 = int(rect[0]), int(rect[1]), int(rect[2]), int(rect[3])
        img_crop = im0s[y1:y2, x1:x2]
        return img_crop

    def setCrop(self, rect):
        self.n_img = self.crop((rect[0][0][0], rect[0][0][1], rect[0][0][2], rect[0][0][3]), self.n_img)
        self.t_img = self.img2pyt(self.n_img)

        return self.t_img, self.n_img

    def setSizeCrop(self, rect, size):
        if self.n_img.shape[1] <= size:
            self.n_img = self.crop((rect[0][0][0], rect[0][0][1], rect[0][0][2], rect[0][0][3]), self.n_img)
        else:
            w = rect[0][0][2] - rect[0][0][0]
            x1 = rect[0][0][0]
            x2 = rect[0][0][2]

            if w < size:
                x2 = x1 + size

            self.n_img = self.crop((x1, rect[0][0][1], x2, rect[0][0][3]), self.n_img)

        self.t_img = self.img2pyt(self.n_img)

        return self.t_img, self.n_img

    def setImg(self, img):
        self.n_img = img
        self.t_img = self.img2pyt(self.n_img)

    def getImg(self):
        return self.t_img, self.n_img

    def passportCrop(self, mrz):
        x1, y1, x2, y2 = mrz
        mrzHeight = y2 - y1

        cropX1 = x1 - mrzHeight if (x1 - mrzHeight) > 0 else 0
        cropX2 = x2 + mrzHeight if (x2 + mrzHeight) < self.n_img.shape[1] else self.n_img.shape[1]
        cropY1 = y1 - mrzHeight * 3 if (y1 - mrzHeight * 3) > 0 else 0
        cropY2 = y2 + mrzHeight if (y2 + mrzHeight) < self.n_img.shape[0] else self.n_img.shape[0]

        self.n_img = self.crop((cropX1, cropY1, cropX2, cropY2), self.n_img)
        self.t_img = self.img2pyt(self.n_img)

        return self.t_img, self.n_img

    def setYCrop(self):
        self.n_img = self.crop((0, int(self.n_img.shape[0] / 2), self.n_img.shape[1], self.n_img.shape[0]),
                                       self.n_img)
        self.t_img = self.img2pyt(self.n_img)

        return self.t_img, self.n_img

    def getOImg(self):
        return self.o_img

    def resize(self, size):
        img = cv2.resize(self.n_img, dsize=(size, size))
        self.setImg(img)

    def resize_ratio(self, image, size):
        width = image.shape[1]
        height = image.shape[0]
        widthBetter = True if width > height else False

        if widthBetter:
            ratio = size / width
            img = cv2.resize(image, dsize=(size, int(height * ratio)))
        else:
            ratio = size / height
            img = cv2.resize(image, dsize=(int(width * ratio), size))

        self.setImg(img)

        return self.t_img, self.n_img

    def resize_test_test(self, image, size):
        width = image.shape[1]
        height = image.shape[0]
        widthBetter = True if width > height else False

        if widthBetter:
            ratio = size / width
            img = cv2.resize(image, dsize=(size, int(height * ratio)))
        else:
            ratio = size / height
            img = cv2.resize(image, dsize=(int(width * ratio), size))

        return img


    def makeSquareWithGray(self):
        w = self.n_img.shape[1]
        h = self.n_img.shape[0]

        if w > h:
            gray = np.zeros((w-h, w, 3), np.uint8)
            gray[:, :, :] = 178
            newImg = np.concatenate((self.n_img, gray), axis=0)
        else:
            gray = np.zeros((h, h-w, 3), np.uint8)
            gray[:, :, :] = 178
            newImg = np.concatenate((self.n_img, gray), axis=1)

        self.setImg(newImg)

    def syncImgSizeWithGray(self):
        w = self.n_img.shape[1]
        h = self.n_img.shape[0]

        size = w if w > h else h

        if size < self.img_size:
            if w > h:
                gray = np.zeros((h, self.img_size - w, 3), np.uint8)
                gray[:, :, :] = 178
                newImg = np.concatenate((self.n_img, gray), axis=1)
            else:
                gray = np.zeros((self.img_size - h, w, 3), np.uint8)
                gray[:, :, :] = 178
                newImg = np.concatenate((self.n_img, gray), axis=0)

            self.setImg(newImg)


def letterbox(img, new_shape=(640, 640), color=(114, 114, 114), auto=True, scaleFill=False, scaleup=True, stride=32):
    # Resize and pad image while meeting stride-multiple constraints
    shape = img.shape[:2]  # current shape [height, width]
    if isinstance(new_shape, int):
        new_shape = (new_shape, new_shape)

    # Scale ratio (new / old)
    r = min(new_shape[0] / shape[0], new_shape[1] / shape[1])
    if not scaleup:  # only scale down, do not scale up (for better test mAP)
        r = min(r, 1.0)

    # Compute padding
    ratio = r, r  # width, height ratios
    new_unpad = int(round(shape[1] * r)), int(round(shape[0] * r))
    dw, dh = new_shape[1] - new_unpad[0], new_shape[0] - new_unpad[1]  # wh padding
    if auto:  # minimum rectangle
        dw, dh = np.mod(dw, stride), np.mod(dh, stride)  # wh padding
    elif scaleFill:  # stretch
        dw, dh = 0.0, 0.0
        new_unpad = (new_shape[1], new_shape[0])
        ratio = new_shape[1] / shape[1], new_shape[0] / shape[0]  # width, height ratios

    dw /= 2  # divide padding into 2 sides
    dh /= 2

    if shape[::-1] != new_unpad:  # resize
        img = cv2.resize(img, new_unpad, interpolation=cv2.INTER_LINEAR)
    top, bottom = int(round(dh - 0.1)), int(round(dh + 0.1))
    left, right = int(round(dw - 0.1)), int(round(dw + 0.1))
    img = cv2.copyMakeBorder(img, top, bottom, left, right, cv2.BORDER_CONSTANT, value=color)  # add border
    return img, ratio, (dw, dh)