MTCNN中celebA數據集的處理（一個置信度，兩個座標點）

我處理這個數據集是用來訓練MTCNN網絡的，celebA數據集由202599張人臉組成，這裏主要是將樣本擴容，即在原有的圖片上摳圖。

因爲上面是MTCNN的框架，由P,R,O三個網絡組成，P網絡輸入的是12×12的圖片，R網絡輸入的是24×24的圖片，O網絡輸入的是48×48的圖片。
所以要把celebA數據集處理成三種尺寸的圖片。
又因爲損失函數有兩個，一個是置信度的損失，另一個是偏移量的損失。置信度的損失要用正樣本和負樣本做，偏移量的損失用正樣本和部分樣本做。
所以每種尺寸圖片下面又要有三種不同的樣本：正樣本（置信度爲1，整張人臉），負樣本（置信度爲0，不包含人臉），部分樣本（置信度爲2，包含人臉的一部分）。

這是celebA數據集的圖片，紅框是建議框，判斷是正樣本、負樣本，部分樣本的依據是：新生成的圖片和建議框的重疊度（iou，iou的計算方法和代碼在上一篇博客）
iou>0.4:正樣本
0.15<iou<0.4:部分樣本
iou<0.15:負樣本

比如：新生成的圖片（藍框）和紅框的重疊度爲0.35，認爲是部分樣本

新生成的圖片（藍框）和紅框的重疊度爲0.1，認爲是負樣本

新生成的圖片（藍框）和紅框的重疊度爲0.8，認爲是正樣本

celebA圖片數據集：

這是兩個座標點的信息（左上角的點和右下角的點）

代碼

import os
from PIL import Image
import numpy as np
import utils
import traceback

# Annotation file read line by line below; each data line supplies an image
# file name followed by the face box as x, y, width, height.
anno_src = r"G:\數據集\celebA\celebA（分卷形式,一起解壓）\celebA\Anno\list_bbox_celeba.txt"
# Directory the image file names from the annotation file are resolved against.
img_dir = r"G:\數據集\celebA\celebA（分卷形式,一起解壓）\celebA\img\img_celeba"

# Root output directory; one sub-directory per face size is created under it.
save_path = r"H:\dataset"

# Build the training sets for the three MTCNN input sizes. For every size,
# random square patches are cropped around (and away from) each annotated face,
# labelled by their IoU with the annotated box, resized to face_size and saved
# together with one annotation line per patch:
#   iou > 0.4          -> positive (label 1)
#   0.15 < iou < 0.4   -> part     (label 2)
#   iou < 0.15         -> negative (label 0)
for face_size in [12, 24, 48]:

    print("gen %i image" % face_size)
    # Directories the cropped sample images are saved to.
    positive_image_dir = os.path.join(save_path, str(face_size), "positive")
    negative_image_dir = os.path.join(save_path, str(face_size), "negative")
    part_image_dir = os.path.join(save_path, str(face_size), "part")

    for dir_path in [positive_image_dir, negative_image_dir, part_image_dir]:
        if not os.path.exists(dir_path):
            os.makedirs(dir_path)

    # Annotation files: one text line per saved sample.
    positive_anno_filename = os.path.join(save_path, str(face_size), "positive.txt")
    negative_anno_filename = os.path.join(save_path, str(face_size), "negative.txt")
    part_anno_filename = os.path.join(save_path, str(face_size), "part.txt")

    # Running counters; they double as the file names of the saved images.
    positive_count = 0
    negative_count = 0
    part_count = 0

    # This script only regresses the bounding box. Ten zero placeholders are
    # written for the landmark offsets so every annotation line keeps the same
    # number of fields.
    landmark_offsets = [0] * 10

    # "with" closes every file that was opened, even when a later open() fails
    # (a try/finally calling close() on all three would hit unbound names).
    with open(positive_anno_filename, "w") as positive_anno_file, \
            open(negative_anno_filename, "w") as negative_anno_file, \
            open(part_anno_filename, "w") as part_anno_file, \
            open(anno_src) as anno_file:

        for i, line in enumerate(anno_file):
            # Skip the first two lines (presumably the header of the annotation file).
            if i < 2:
                continue
            try:
                strs = line.strip().split()
                image_filename = strs[0].strip()
                print(image_filename)
                image_file = os.path.join(img_dir, image_filename)

                with Image.open(image_file) as img:
                    img_w, img_h = img.size
                    x1 = float(strs[1].strip())
                    y1 = float(strs[2].strip())
                    w = float(strs[3].strip())
                    h = float(strs[4].strip())
                    x2 = float(x1 + w)
                    y2 = float(y1 + h)

                    # Skip faces that are too small or have an invalid box.
                    if max(w, h) < 40 or x1 < 0 or y1 < 0 or w < 0 or h < 0:
                        continue

                    # Ground-truth boxes as a 2-D array (one row per box), built
                    # once and shared by both sampling loops below.
                    boxes = [[x1, y1, x2, y2]]
                    _boxes = np.array(boxes)

                    # Centre of the annotated face.
                    cx = x1 + w / 2
                    cy = y1 + h / 2

                    # Five jittered crops around the face; these mostly yield
                    # positive and part samples.
                    for _ in range(5):
                        # Shift the centre by up to half the box size.
                        # randint is documented for integer bounds, so cast explicitly.
                        w_ = np.random.randint(int(-w * 0.5), int(w * 0.5))
                        h_ = np.random.randint(int(-h * 0.5), int(h * 0.5))
                        cx_ = cx + w_
                        cy_ = cy + h_

                        # Square crop with a randomly scaled side length.
                        side_len = np.random.randint(int(min(w, h) * 0.8), int(np.ceil(1.25 * max(w, h))))
                        # Clamp the top-left corner to the image origin. The
                        # built-in max() is required here: np.max(value, 0)
                        # treats 0 as the axis argument and clamps nothing.
                        x1_ = max(cx_ - side_len / 2, 0)
                        y1_ = max(cy_ - side_len / 2, 0)
                        x2_ = x1_ + side_len
                        y2_ = y1_ + side_len

                        crop_box = np.array([x1_, y1_, x2_, y2_])

                        # Offsets of the true box corners relative to the crop,
                        # normalised by the crop side length.
                        offset_x1 = (x1 - x1_) / side_len
                        offset_y1 = (y1 - y1_) / side_len
                        offset_x2 = (x2 - x2_) / side_len
                        offset_y2 = (y2 - y2_) / side_len

                        # Cut the patch out and scale it to the network input size.
                        face_crop = img.crop(crop_box)
                        face_resize = face_crop.resize((face_size, face_size))

                        iou = utils.iou(crop_box, _boxes)[0]
                        if iou > 0.4:  # positive sample
                            positive_anno_file.write(
                                "positive/{0}.jpg {1} {2} {3} {4} {5} {6} {7} {8} {9} {10} {11} {12} {13} {14} {15}\n".format(
                                    positive_count, 1, offset_x1, offset_y1,
                                    offset_x2, offset_y2, *landmark_offsets))
                            positive_anno_file.flush()
                            face_resize.save(os.path.join(positive_image_dir, "{0}.jpg".format(positive_count)))
                            positive_count += 1
                        elif 0.15 < iou < 0.4:  # part sample
                            part_anno_file.write(
                                "part/{0}.jpg {1} {2} {3} {4} {5} {6} {7} {8} {9} {10} {11} {12} {13} {14} {15}\n".format(
                                    part_count, 2, offset_x1, offset_y1,
                                    offset_x2, offset_y2, *landmark_offsets))
                            part_anno_file.flush()
                            face_resize.save(os.path.join(part_image_dir, "{0}.jpg".format(part_count)))
                            part_count += 1
                        elif iou < 0.15:  # negative sample
                            negative_anno_file.write(
                                "negative/{0}.jpg {1} 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n".format(negative_count, 0))
                            negative_anno_file.flush()
                            face_resize.save(os.path.join(negative_image_dir, "{0}.jpg".format(negative_count)))
                            negative_count += 1

                    # Extra negatives: the jittered crops above rarely fall
                    # below the negative threshold, so sample five random
                    # squares anywhere in the image and keep the ones that
                    # barely overlap the face.
                    for _ in range(5):
                        side_len = np.random.randint(face_size, min(img_w, img_h) // 2)
                        x_ = np.random.randint(0, img_w - side_len)
                        y_ = np.random.randint(0, img_h - side_len)
                        crop_box = np.array([x_, y_, x_ + side_len, y_ + side_len])

                        if np.max(utils.iou(crop_box, _boxes)) < 0.15:
                            face_crop = img.crop(crop_box)
                            # Image.LANCZOS is the same filter as the
                            # Image.ANTIALIAS alias that Pillow 10 removed.
                            face_resize = face_crop.resize((face_size, face_size), Image.LANCZOS)

                            negative_anno_file.write("negative/{0}.jpg {1} 0 0 0 0 0 0 0 0 0 0 0 0 0 0\n".format(negative_count, 0))
                            negative_anno_file.flush()
                            face_resize.save(os.path.join(negative_image_dir, "{0}.jpg".format(negative_count)))
                            negative_count += 1
            except Exception:
                # Deliberately best-effort: report the failing image (bad
                # annotation line, unreadable file, image too small for the
                # random ranges) and carry on with the next one.
                traceback.print_exc()

結果

樣本的txt文件，裏面每一行是：圖片名，置信度，四個邊框偏移量，以及十個關鍵點偏移量（這裏沒有用到關鍵點，全部寫0）

MTCNN中celebA數據集的處理（一個置信度，兩個座標點）

卷積、池化後特徵圖大小計算公式

python中.flush()意思

MTCNN中celebA數據集的處理（一個置信度，兩個座標點）

MTCNN中非極大值抑制NMS代碼

python中.copy()的用法

Mac下配置sublime實現LaTeX

https://yachay.unat.edu.pe/blog/index.php?comment_area=format_blog&comment_component=blog&comment_co

linux以太網驅動總結