# Python image-processing utility class (Python图像综合处理相关类)
#
# Download link for the font file that self.Font refers to: https://jhc001.lanzoub.com/i531g0wlq9kj
# !/usr/bin/env python3
# -*- coding: UTF-8 -*-
"""
@author  : v_jiaohaicheng@baidu.com
@des     :

"""
import json
import cv2 as cv
import numpy as np
import copy
import PIL.JpegImagePlugin
from PIL import ImageFont, Image, ImageDraw
from sdk.utils.util_file import FileProcess
from sdk.utils.util_folder import FolderPathProcess


class ImgMark():
    """
    图像标注转化处理类
    """
    def __init__(self):
        """Set the default annotation options and create the file helpers."""
        # ---- label content -------------------------------------------
        # Draw the text of every entry.
        self.TEXT = True
        # Prefix every label with the entry's sequence number.
        self.INDEX = True
        # Append a suffix to every label (only applied while TEXT is on).
        self.TEXT_TAIL = True
        # The suffix appended when TEXT_TAIL is enabled.
        self.text_tail = "中文"

        # ---- label appearance ----------------------------------------
        # Font size of the labels.
        self.SIZE = 15
        # Label anchor: True uses the point with the smallest x,
        # False uses the point with the largest y (see get_m_opt).
        self.WORD_POS = False
        # Font file used to render the labels.
        self.Font = R"SourceHanSerifSC-Bold.otf"
        # Label colour.
        self.TXT_COLOR = "green"

        # ---- shape appearance ----------------------------------------
        # Draw the boxes / lines at all.
        self.MARK = True
        # Colour of the boxes / lines.
        self.COLOR = (255, 0, 0)
        # Stroke thickness of the boxes / lines.
        self.THICKNESS = 1
        # True draws open lines, False draws closed boxes.
        self.LINE = False
        # OpenCV line type used for drawing.
        self.LINE_TYPE = cv.LINE_8

        # ---- project helpers -----------------------------------------
        # Project-specific file helper.
        self.Fpr = FileProcess()
        # Project-specific folder/path helper.
        self.Fpp = FolderPathProcess()

    def get_copy(self, args: object) -> object:
        """
        Return a deep copy of ``args``.

        Useful before handing a mapping to a method that may modify it, so
        that the caller's original stays untouched.

        :param args: any deep-copyable object (dict, list, str, int, tuple, ...)
        :return: an independent deep copy of ``args``
        """
        return copy.deepcopy(args)

    def read_image(self, file: str) -> np.ndarray:
        """
        Read an image from disk through Pillow (non-ASCII paths are supported).

        :param file: path of the image file
        :return: the pixel data as a writable array, in Pillow's channel
            order (RGB for colour images)
        """
        # np.array() copies the pixels. np.asarray() on a Pillow image yields
        # a read-only array, which the in-place OpenCV drawing calls used by
        # other methods cannot write to. The context manager also closes the
        # underlying file handle once the pixels are loaded.
        with Image.open(file) as picture:
            return np.array(picture)

    def tran_gray(self, img: np.ndarray) -> np.ndarray:
        """
        Convert a colour image to grayscale.

        Images in this class are kept in RGB channel order (they are loaded
        through Pillow and converted RGB -> BGR only when saved), so the RGB
        conversion code is used; the BGR code would swap the red and blue
        luminance weights.

        :param img: colour image in RGB channel order
        :return: single-channel grayscale image
        """
        return cv.cvtColor(img, cv.COLOR_RGB2GRAY)

    def tran_binary(self,img:np)->np:
        """
        Binarize an image with Otsu's threshold.

        Colour input is first reduced to grayscale via ``tran_gray``.

        :param img: grayscale or colour image
        :return: the thresholded image (pixels are 0 or 255)
        """
        gray = img if self.check_is_gray(img) else self.tran_gray(img)
        _, binary = cv.threshold(
            gray, 0, 255, cv.THRESH_BINARY + cv.THRESH_OTSU)
        return binary

    def check_is_gray(self,img:np)->bool:
        """
        Tell whether an image is grayscale.

        The array is cast to uint8 and wrapped in a Pillow image; the image
        counts as grayscale when Pillow reports mode "L" or "LA".

        :param img: image array
        :return: True for a grayscale image, False otherwise
        """
        pil_mode = Image.fromarray(np.uint8(img)).mode
        return pil_mode in ("L", "LA")

    def get_img_shape(self, img: np) -> tuple:
        """
        Return the ``shape`` attribute of an image array.

        :param img: image array
        :return: the array's shape, e.g. (height, width, channels) for a
            colour image
        """
        shape = img.shape
        return shape

    def resize(self, img: np.ndarray,
               newsize: tuple[int, int] = None, rate: int = None) -> np.ndarray:
        """
        Resize an image to an explicit size or by a scale factor.

        :param img: image array (cast to uint8 before resizing)
        :param newsize: target size as (width, height), the order expected by
            Pillow's ``Image.resize``; ignored when ``rate`` is given
        :param rate: scale factor; a positive value multiplies both sides by
            ``rate``, a negative value divides both sides by ``abs(rate)``
        :return: the resized image as a new, writable array
        :raises ValueError: if neither ``newsize`` nor ``rate`` is given
        """
        if rate:
            # Only the first two axes are needed, so grayscale (2-D) input
            # works as well as colour input.
            origin_h, origin_w = self.get_img_shape(img)[:2]
            if rate > 0:
                new_w = int(origin_w * rate)
                new_h = int(origin_h * rate)
            else:
                new_w = int(origin_w / abs(rate))
                new_h = int(origin_h / abs(rate))
            # Pillow wants (width, height); passing (height, width) would
            # swap the sides of every non-square image.
            newsize = (new_w, new_h)

        if newsize is None:
            raise ValueError("resize() needs either newsize or rate")

        return np.array(Image.fromarray(np.uint8(img)).resize(newsize))

    def transpose_image(
            self, img: [np.ndarray, PIL.JpegImagePlugin.JpegImageFile], key: int = 0) -> np:
        """
        Rotate an image counter-clockwise by ``key`` degrees.

        :param img: a numpy image array or any Pillow image (JPEG images
            included)
        :param key: rotation angle in degrees, counter-clockwise
        :return: a writable numpy array for array input, a Pillow image for
            Pillow input
        :raises ValueError: if ``img`` is neither an array nor a Pillow image
        """
        if isinstance(img, np.ndarray):
            # np.array() gives a writable copy that can be drawn on afterwards.
            return np.array(Image.fromarray(np.uint8(img)).rotate(key))
        # Image.Image is the base class of every Pillow image, so images of
        # other formats (PNG, BMP, ...) are accepted alongside JPEG ones.
        if isinstance(img, Image.Image):
            return img.rotate(key)
        raise ValueError("type error {}".format(type(img)))

    def mirror(self,img:np,key:int):
        """
        Flip an image.

        :param img: image array
        :param key: flip code handed to ``cv.flip``; 0 flips vertically,
            1 flips horizontally
        :return: the flipped image
        """
        flipped = cv.flip(img, key)
        return flipped

    def save_image(self, img: np.ndarray, file: str):
        """
        Encode an image and write it to ``file``.

        The encoder is chosen from the file extension, obtained through
        ``self.Fpr.get_file_tail``. Writing goes through ``ndarray.tofile``
        instead of ``cv.imwrite``.

        :param img: image array; colour images are expected in RGB order,
            single-channel (grayscale / binary) images are written as they are
        :param file: destination path
        :raises OSError: if OpenCV reports that encoding failed
        """
        suffix = ".{}".format(self.Fpr.get_file_tail(file))

        single_channel = img.ndim == 2 or (img.ndim == 3 and img.shape[2] == 1)
        if single_channel:
            # RGB -> BGR is undefined for one channel and would raise.
            encodable = img
        else:
            # OpenCV encoders expect BGR channel order.
            encodable = cv.cvtColor(img, cv.COLOR_RGB2BGR)

        ok, buffer = cv.imencode(suffix, encodable)
        if not ok:
            raise OSError("failed to encode image as {}".format(suffix))
        buffer.tofile(file)

    def add_words(self, img: np.ndarray, map: dict) -> np.ndarray:
        """
        Draw a text label for every entry of ``map`` (CJK and Latin text).

        The label is built from the entry's sequence number (``INDEX``), its
        text (``TEXT``) and the configured suffix (``TEXT_TAIL``), and is
        placed at one of the two anchor points returned by ``get_m_opt``,
        selected by ``WORD_POS``. ``map`` is never modified.

        :param img: image array (cast to uint8 before drawing)
        :param map: annotation mapping of the form::

                {
                    "index": {
                        "text": "",
                        "opt": []
                    }
                }

            where each key is convertible with ``int()`` and ``opt`` is a
            list of [x, y] points
        :return: the labelled image converted to RGBA, or ``img`` itself
            when ``map`` is empty
        """
        font = ImageFont.truetype(self.Font, size=self.SIZE)
        if not map:
            return img

        # Convert to a Pillow image once and draw every label on it,
        # instead of a full array <-> Pillow round trip per entry.
        canvas = Image.fromarray(np.uint8(img))
        draw = ImageDraw.Draw(canvas)

        for index, value in map.items():
            min_x, max_y = self.get_m_opt(value["opt"])
            xy = min_x if self.WORD_POS else max_y

            # Use a local variable: writing "" back into value["text"] would
            # silently alter the caller's data.
            body = value["text"] if self.TEXT else ""

            if self.INDEX:
                number = int(index) + 1
                # With the text switched off only the bare number is shown,
                # without the "." separator.
                text = "{}.{}".format(number, body) if self.TEXT else str(number)
            else:
                text = body

            # The suffix is only meaningful next to real text.
            if self.TEXT and self.TEXT_TAIL:
                text = "{}_{}".format(text, self.text_tail)

            draw.text(
                xy=xy,
                text=text,
                font=font,
                fill=self.TXT_COLOR,
            )

        return cv.cvtColor(np.asarray(canvas), cv.COLOR_RGB2RGBA)

    def get_m_opt(self, list: list) -> tuple[list, list]:
        """
        获取 右上角坐标，左下角坐标 附带偏移量
        :param list:
        :return:
        """
        min_x = [100000000, 100000000]
        max_y = [0, 0]
        for args in list:
            # 赋值时复制个副本操作，避免下边计算偏移量时影响原值
            if args[0] < min_x[0]:
                min_x = args[::]
            if args[1] > max_y[1]:
                max_y = args[::]
        # 计算偏移量
        min_x[1] = min_x[1] - self.SIZE - 5
        max_y[1] = max_y[1] - self.SIZE - 5

        return (min_x, max_y)

    def mark(self, img: np, map: dict) -> np:
        """
        Draw the box or line of every entry onto the image.

        Nothing is drawn while ``MARK`` is off. An entry with exactly two
        points is drawn as a rectangle when boxes are requested (``LINE``
        off); every other entry is drawn as a polyline, closed when ``LINE``
        is off and open when it is on.

        :param img: image array, drawn on in place
        :param map: annotation mapping whose values carry the points under
            the "opt" key
        :return: the annotated image
        """
        if not self.MARK:
            return img

        for entry in map.values():
            points = entry["opt"]

            if len(points) == 2 and not self.LINE:
                # Two points describe opposite corners of a rectangle.
                cv.rectangle(
                    img=img,
                    pt1=tuple(points[0]),
                    pt2=tuple(points[1]),
                    color=self.COLOR,
                    thickness=self.THICKNESS,
                    lineType=self.LINE_TYPE,
                )
                continue

            outline = [np.array(points, dtype=np.int32)]
            img = cv.polylines(
                img=img,
                pts=outline,
                isClosed=not self.LINE,
                color=self.COLOR,
                thickness=self.THICKNESS,
                lineType=self.LINE_TYPE
            )

        return img

    def add_mosaic(self, img: np, opt: tuple[[int, int], [
                   int, int]], neighbor: int = 5) -> np:
        """
        添加马赛克
        :param img:
        :param opt:[左上，右下]
        :param neighbor:
        :return:
        """
        fh, fw, fb = self.get_img_shape(img)
        x, y = opt[0]
        w, h = opt[1][0] - opt[0][0], opt[1][1] - opt[0][1]
        if (y + h > fh) or (x + w > fw):
            pass
        else:
            for i in range(0, h - neighbor, neighbor):
                for j in range(0, w - neighbor, neighbor):
                    rect = [j + x, i + y, neighbor, neighbor]
                    color = tuple(img[i + y][j + x].tolist())
                    left_up = (rect[0], rect[1])
                    right_down = (
                        rect[0] + neighbor - 1,
                        rect[1] + neighbor - 1)
                    img = cv.rectangle(img, left_up, right_down, color, -1)
        return img

    def cut_img(self, img: np, opt: tuple[[int, int], [int, int]]) -> np:
        """
        Crop a rectangular region out of the image.

        :param img: image array
        :param opt: ``([left, top], [right, bottom])`` of the region
        :return: the slice ``img[top:bottom, left:right]``
        """
        top_left, bottom_right = opt[0], opt[1]
        rows = slice(top_left[1], bottom_right[1])
        cols = slice(top_left[0], bottom_right[0])
        return img[rows, cols]

    def change_light_contrast(
            self, img: np.ndarray, light: int = None, contrast: float = None) -> np.ndarray:
        """
        Adjust the brightness and/or the contrast of an image.

        :param img: image array
        :param light: brightness offset added to every pixel, intended range
            (-250, 250); skipped when ``None`` or 0
        :param contrast: contrast gain, intended range (0, 1.5); skipped when
            ``None`` or 0
        :return: the adjusted image
        """
        if light:
            # Blending with an all-zero image at weight 0 leaves the pixels
            # as they are, so only the constant offset takes effect.
            blank = np.zeros(img.shape, img.dtype)
            img = cv.addWeighted(img, 1, blank, 0, light)
        if contrast:
            # alpha/beta must be passed by keyword: the second positional
            # parameter of convertScaleAbs is the output array ``dst``.
            img = cv.convertScaleAbs(img, alpha=contrast, beta=contrast * 10)

        return img

    def make_map(self, file=None, date=None) -> dict:
        """
        从不同源 读取数据生成 map
            self.Fpr.get_line：按行获取文件内容
                返回格式：{
                    "headers": headers, # 文本标题行 list
                    "line": num, # 文本行号 num>=1
                    "date": date # 文本行内容 list
                }

        :param file: txt
        :param date: excel
        :return:
        """
        map = {}
        if file:
            for args in self.Fpr.get_line(file):
                date = args["date"]
                headers = args["headers"]
                line = args["line"]
                map[str(line)] = {
                    "opt": [[int(i[0]), int(i[1])] for i in date[headers.index("points")]],
                    "text": date[headers.index("text")],
                }
        if date:
            json_data = json.loads(date, strict=False)
            for result in json_data["result"]:
                for index, element in enumerate(result["elements"]):
                    map[index + 1] = {
                        "opt": [[int(i[0]), int(i[1])] for i in element["points"]],
                        "text": element["text"]
                    }
        return map

    def process(self, *args, **kwargs) -> list[dict]:
        """
        Extension hook: subclasses override this with their own pipeline.

        The base implementation does nothing.

        :return: ``None`` in this base class
        """
        return None


def main():
    """Demo: pixelate, label, outline, binarize and mirror a sample image."""
    marker = ImgMark()
    source_path = R"D:\Desktop\2\1.jpg"
    target_path = R"D:\Desktop\2\1_1.png"
    img = marker.read_image(source_path)

    img = marker.add_mosaic(img, ([100, 150], [180, 270]))

    img = marker.transpose_image(img, 0)
    # Sample annotations: a quadrilateral, a three-point polyline and a
    # two-point rectangle.
    annotations = {
        "0": {
            "text": "中国人",
            "opt": [[10, 5], [20, 30], [70, 20], [50, 10]],
        },
        "1": {
            "text": "新冠肺炎疫情对于全球经济产生了极其深远的影响",
            "opt": [[200, 220], [220, 300], [300, 345]]
        },
        "2": {
            "text": "脑残",
            "opt": [[150, 200], [100, 150]]
        }
    }
    # Each step gets its own deep copy of the annotations.
    img = marker.add_words(
        img, marker.get_copy(annotations)
    )
    img = marker.mark(img, marker.get_copy(annotations))
    # Optional steps, kept for reference:
    # img = marker.resize(img, rate=2)
    # img = marker.cut_img(img, ([100, 150], [180, 270]))
    # img = marker.change_light_contrast(img, contrast=1)
    # img = marker.tran_gray(img)
    img = marker.tran_binary(img)
    img = marker.mirror(img, 1)
    marker.save_image(img, target_path)


if __name__ == '__main__':
    main()
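# Article compiled by 极客之音; permalink: https://www.bmabk.com/index.php/post/156854.html
# Title: Python图像综合处理相关类 (Python image-processing utility class)
#
# Related posts (相关推荐)
#
# Leave a reply (发表回复)
#
# Share to (分享到):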