Python 提取圖像信息保存爲TXT、xml格式

1.首先提取圖像爲TXT格式，格式如下: xxxx.jpg 通道數 xmin,ymin,xmax,ymax

2.代碼如下

# -*- coding:utf-8 -*-

'''
作者：tanbin
時間：2019年10月31日
代碼工作內容：1.對文件下sex_image/*.jpg進行重命名
            2.對對文件下sex_image/*.jpg


'''


import os
import cv2
import xml.etree.ElementTree as ET
from  PIL import  Image
import numpy as np




#圖像處理類  內置各種函數
class image_processing():

    def __init__(self):
        self.img_path="./sex_image/"
        self.annotations_txt_path="./"
        self.annotations_xml_path="./sex_xml/"
        if not os.path.exists(self.annotations_xml_path):
               os.makedirs(self.annotations_xml_path)

    #圖像批量重命名
    def rename(self):
        imagelist = os.listdir(self.img_path)
        total_num = len(imagelist) #得到圖像數量大小

        i=4500
        for item in imagelist:
                # print item
            if item.endswith('.jpg'):
                src = os.path.join(os.path.abspath(self.img_path), item)
                dst = os.path.join(os.path.abspath(self.img_path), '00' + format(str(i), '0>4s') + '.jpg')
                os.rename(src, dst)
                print ('converting %s to %s ...' % (src, dst))
                i = i + 1
        print('total %d to rename & converted %d jpgs' % (total_num, i))


    #提取圖像的shape到txt文件裏
    def get_image_information(self):
        image_list=os.listdir(self.img_path)
        print image_list
        total_num=len(image_list)

        file_txt=open('./sex_image_txt.txt',"w")

        for i in range(10):
            img=cv2.imread(os.path.join(self.img_path+image_list[i]))
            image_shape=img.shape
            print image_shape
            file_txt.write(image_list[i]+' '+'3 '+'5 '+'5 '+str(image_shape[0]-5)+str(image_shape[1]-5))
        file_txt.close()


if __name__ == '__main__':
    newname = image_processing()
    #newname.rename()
    newname.get_image_information()

得到一個txt文件，裏面內容如圖

3.Python提取圖像信息爲xml

# -*- coding:utf-8 -*-
from xml.dom.minidom import Document
import os
from PIL import Image

ann_path = "./sex_image_txt.txt"
img_path = "./sex_image/"
xml_path = "./sex_xml_2/"

#標籤的類別
label_list = ["salacity"]

if not os.path.exists(xml_path):
    os.mkdir(xml_path)

def writeXml(imgname,imgpath, w, h, label_list, wxml):
    doc = Document()
    #owner
    annotation = doc.createElement('annotation')
    doc.appendChild(annotation)
    #owner
    folder = doc.createElement('folder')
    annotation.appendChild(folder)
    folder_txt = doc.createTextNode("R_dataset")
    folder.appendChild(folder_txt)

    filename = doc.createElement('filename')
    annotation.appendChild(filename)
    filename_txt = doc.createTextNode(imgname)
    filename.appendChild(filename_txt)

    path = doc.createElement('path')
    annotation.appendChild(path)
    path_txt = doc.createTextNode(imgpath)
    path.appendChild(path_txt)
    #ones#
    source = doc.createElement('source')
    annotation.appendChild(source)

    database = doc.createElement('database')
    source.appendChild(database)
    database_txt = doc.createTextNode("The R Database")
    database.appendChild(database_txt)
    #onee#
    #twos#
    size = doc.createElement('size')
    annotation.appendChild(size)

    width = doc.createElement('width')
    size.appendChild(width)
    width_txt = doc.createTextNode(str(w))
    width.appendChild(width_txt)

    height = doc.createElement('height')
    size.appendChild(height)
    height_txt = doc.createTextNode(str(h))
    height.appendChild(height_txt)

    depth = doc.createElement('depth')
    size.appendChild(depth)
    depth_txt = doc.createTextNode("3")
    depth.appendChild(depth_txt)
    #twoe#
    segmented = doc.createElement('segmented')
    annotation.appendChild(segmented)
    segmented_txt = doc.createTextNode("0")
    segmented.appendChild(segmented_txt)

    # object
    object = doc.createElement('object')
    annotation.appendChild(object)

    name = doc.createElement('name')
    object.appendChild(name)
    name_content = doc.createTextNode(label_list[0])
    name.appendChild(name_content)

    pose=doc.createElement('pose')
    object.appendChild(pose)
    pose_content=doc.createTextNode("0")
    pose.appendChild(pose_content)

    truncated=doc.createElement('truncated')
    object.appendChild(truncated)
    truncated_content=doc.createTextNode("0")
    truncated.appendChild(truncated_content)

    difficult=doc.createElement('difficult')
    object.appendChild(difficult)
    difficult_content=doc.createTextNode("0")
    difficult.appendChild(difficult_content)

    bndbox=doc.createElement('bndbox')
    object.appendChild(bndbox)

    xmin=doc.createElement('xmin')
    bndbox.appendChild(xmin)
    xmin_content=doc.createTextNode(str(5))
    xmin.appendChild(xmin_content)

    ymin=doc.createElement('ymin')
    bndbox.appendChild(ymin)
    ymin_content=doc.createTextNode(str(5))
    ymin.appendChild(ymin_content)


    xmax=doc.createElement('xmax')
    bndbox.appendChild(xmax)
    xmax_content=doc.createTextNode(str(w-5))
    xmax.appendChild(xmax_content)

    ymax=doc.createElement('ymax')
    bndbox.appendChild(ymax)
    ymax_content=doc.createTextNode(str(h-5))
    ymax.appendChild(ymax_content)

        #threee#
    with open(wxml, "w") as f:
        f.write(doc.toprettyxml(indent = '\t', encoding='utf-8'))
        #f.write(doc.toprettyxml())
    f.close()

    return


f = open(ann_path, 'r')
txt_list = f.readlines()
f.close()
im_name_list = []

for line in txt_list:
    line = line.strip()
    line_split = line.split(' ')
    # print  line

    img_name = line_split[0]
    im_name_list.append(img_name)


    fileimgpath = os.path.join(img_path, img_name)
    im=Image.open(fileimgpath)
    width= int(im.size[0])
    height= int(im.size[1])
    # print width,height
    # print label_list
    savename = os.path.join(xml_path , img_name.split('.')[0] + '.xml')
    writeXml(img_name,fileimgpath, width, height, label_list, savename)

結果如圖如下所示：

ps:

這裏採用OpenCv 、PIL.image提取圖像的寬高有細微的差別：

PIL的提取圖像大小用的是image.size，而OpenCV對應的是image.shape。

另外image.size默認輸出的結果是寬和高，而OPenCV默認輸出的結果是高和寬。【具體的參考博客Python實現圖像處理：PIL和OpenCV提取圖像大小的方法和區別】

Python 提取圖像信息保存爲TXT、xml格式

再談23種設計模式（3）：行爲型模式（學習筆記）

Power Automate Desktop 安裝完，登錄後老是提示one driver 錯誤

微前端學習筆記(4):從微前端到微模塊之EMP與hel-micro方案探索

微前端學習筆記（1）：微前端總體架構概述，從微服務發微

985 碩士程序員，空窗 4 個月沒有 Offer！

一文搞懂 Spring 循環依賴

賽博鬥地主——使用大語言模型扮演Agent智能體玩牌類遊戲。

VScode右鍵打開(添加到右鍵)

記一次 .NET某工控視覺自動化系統卡死分析

WindowsServer--SQL Server搭建主從同步實現讀寫分離 - 事務性分發

python txt預處理，處理成需要的格式

Ubuntu鏡像軟件下載

Python 提取圖像信息保存爲TXT、xml格式

python處理圖像文件中損壞的圖片以及批量裁剪指定的圖片大小

刪除xml或者圖像文件夾多餘的文件

Mac下配置sublime實現LaTeX

https://yachay.unat.edu.pe/blog/index.php?comment_area=format_blog&comment_component=blog&comment_co

linux以太網驅動總結