prepareGTA.py

# encoding: utf-8
"""
@author:  jixunbo
@contact: jixunbo@gmail.com
"""


import os
import os.path as osp
import csv
from shutil import copyfile
import cv2
import time
import configparser
import numpy as np
import random

# You only need to change these lines to your dataset download path
download_path = '/Users/jixunbo/Downloads/Train_single_view'
# download_path = '/Users/jixunbo/Downloads/'

label_path = '/Users/jixunbo/Desktop/ReIDataset/MOT17Labels'
# save_path = '/content/drive/My Drive/GTA'
save_path = '/Users/jixunbo/Desktop/GTA1'
crop_W = 64
crop_H = 128
val_num = 0  # To random select number of frames allcated to validation
query_num = 3  # To random select number of frames allcated to query
min_frames = 5  # To check the sequence longer than 5 frames
num_sample = 20


def _sequence(seq_name, _mot_dir, _mot17_label_dir, _dets, _vis_threshold):
    _train_folders = os.listdir(_mot_dir)
    # _test_folders = os.listdir(os.path.join(_mot_dir, 'test'))
    # _train_folders = _mot_dir
    if seq_name:
        assert seq_name in _train_folders, \
            'Image set does not exist: {}'.format(seq_name)

    if seq_name in _train_folders:
        seq_path = osp.join(_mot_dir, seq_name)
#         label_path = osp.join(self._label_dir, 'train', 'MOT16-'+seq_name[-2:])
        mot17_label_path = osp.join(_mot17_label_dir, 'train')
    else:
        seq_path = osp.join(_mot_dir, 'test', seq_name)
#         label_path = osp.join(self._label_dir, 'test', 'MOT16-'+seq_name[-2:])
        mot17_label_path = osp.join(_mot17_label_dir, 'test')
#     raw_label_path = osp.join(self._raw_label_dir, 'MOT16-'+seq_name[-2:])

    config_file = osp.join(seq_path, 'seqinfo.ini')

    assert osp.exists(config_file), \
        'Config file does not exist: {}'.format(config_file)

    config = configparser.ConfigParser()
    config.read(config_file)
    seqLength = int(config['Sequence']['seqLength']) 
    # imDir = config['Sequence']['imDir']

    # imDir = osp.join(seq_path, imDir)
    # gt_file = osp.join(seq_path, 'gt', 'gt.txt')

    total = []
    train = []
    val = []

    visibility = {}
    boxes = {}
    cams = {}

    for i in range(1, seqLength*2 + 1):
        boxes[i] = {}
        visibility[i] = {}
        cams[i] = []

    cam='camera1'
    gt_file = osp.join(
        seq_path, 'gt', '{}_new_gt_with_pid.txt'.format(cam))

    no_gt = False
    if osp.exists(gt_file):
        with open(gt_file, "r") as inf:
            reader = csv.reader(inf, delimiter=',')
            for row in reader:
                # print(row)
                # class person, certainity 1, visibility >= 0.25
                if int(row[6]) == 1 and int(row[7]) == 1 and float(row[8]) >= _vis_threshold:
                    # Make pixel indexes 0-based, should already be 0-based (or not)
                    x1 = int(row[2]) - 1
                    y1 = int(row[3]) - 1
                    # This -1 accounts for the width (width of 1 x1=x2)
                    x2 = x1 + int(row[4]) - 1
                    y2 = y1 + int(row[5]) - 1
                    bb = np.array([x1, y1, x2, y2], dtype=np.float32)
                    boxes[int(row[0])*2-1][int(row[1])] = bb
                    visibility[int(row[0])*2-1][int(row[1])] = float(row[8])
    else:
        no_gt = True
    
    cam='camera2'
    gt_file = osp.join(
        seq_path, 'gt', '{}_new_gt_with_pid.txt'.format(cam))

    no_gt = False
    if osp.exists(gt_file):
        with open(gt_file, "r") as inf:
            reader = csv.reader(inf, delimiter=',')
            for row in reader:
                # print(row)
                if int(row[0])==0:
                    continue
                # class person, certainity 1, visibility >= 0.25
                if int(row[6]) == 1 and int(row[7]) == 1 and float(row[8]) >= _vis_threshold:
                    # Make pixel indexes 0-based, should already be 0-based (or not)
                    x1 = int(row[2]) - 1
                    y1 = int(row[3]) - 1
                    # This -1 accounts for the width (width of 1 x1=x2)
                    x2 = x1 + int(row[4]) - 1
                    y2 = y1 + int(row[5]) - 1
                    bb = np.array([x1, y1, x2, y2], dtype=np.float32)
                    boxes[int(row[0])*2][int(row[1])] = bb
                    visibility[int(row[0])*2][int(row[1])] = float(row[8])
    else:
        no_gt = True
        # det_file = osp.join(
        #     mot17_label_path,
        #     f"{seq_name}-{_dets[:-2]}",
        #     'det',
        #     'det.txt')

        # if osp.exists(det_file):
        #     with open(det_file, "r") as inf:
        #         reader = csv.reader(inf, delimiter=',')
        #         for row in reader:
        #             x1 = float(row[2]) - 1
        #             y1 = float(row[3]) - 1
        #             # This -1 accounts for the width (width of 1 x1=x2)
        #             x2 = x1 + float(row[4]) - 1
        #             y2 = y1 + float(row[5]) - 1
        #             score = float(row[6])
        #             bb = np.array([x1, y1, x2, y2, score], dtype=np.float32)
        #             dets[int(row[0])].append(bb)

    cam = 'camera1'
    imDir = osp.join(seq_path, cam)
    for i in range(1, seqLength*2 + 1,2):
        im_path = osp.join(imDir, "{}.jpeg".format(i))

        sample = {'seq_name': seq_name,
                  'gt': boxes[i],
                  'im_path': im_path,
                  'vis': visibility[i],
                  'cams': cam, }

        total.append(sample)
    cam = 'camera2'
    imDir = osp.join(seq_path, cam)
    for i in range(2, seqLength*2 + 1,2):
        im_path = osp.join(imDir, "{}.jpeg".format(i))

        sample = {'seq_name': seq_name,
                  'gt': boxes[i],
                  'im_path': im_path,
                  'vis': visibility[i],
                  'cams': cam, }

        total.append(sample)

    return total, no_gt


def build_samples(data, _seq_name):
    """Builds the samples out of the sequence."""

    tracks = {}
    timepoint = time.time()
    for sample in data:
        #         print(sample)

        im_path = sample['im_path']
        gt = sample['gt']
        cam = sample['cams']

        # 下面这一段的逻辑是：
        # sample是第一帧，开始sample的第一次循环，gt里包含第一帧的boundingbox之类的
        # 一开始tracks是没有值的，所以下面第一次kv in tracks没有作用，到了kv in gt
        # 的时候，tracks开始把第一帧中的人物加载进去，track[2]就表示id为2的人这一帧
        # 的信息，然后到第二个sample就是第二帧，这时kv in tracks就有用了，k=2时，如果
        # k在第二帧的gt里也出现了，则tracks里的v会append这一帧的gt，就有
        # track[2]=[{gt第一帧},{gt第二帧}]，原来tracks出现过的人物过完之后，del gt是
        # 删掉已经出现过的人的信息，然后到了下面的kv in gt 这时由于出现过的人都删掉了，所以
        # gt里只剩新人了，这时再把gt里这一帧的新人加到tracks里，以此类推一帧一帧把人都加进去

        for k, v in tracks.items():
            if k in gt.keys():
                v.append({'id': k, 'im_path': im_path,
                          'gt': gt[k], 'cams': cam})
                del gt[k]
        # For all remaining BB in gt new tracks are created
        for k, v in gt.items():
            tracks[k] = [{'id': k, 'im_path': im_path, 'gt': v, 'cams': cam}]
    # sample max_per_person images and filter out tracks smaller than 4 samples
    # outdir = get_output_dir("siamese_test")
    res = []
    # print(len(tracks.items()))

    for k, v in tracks.items():

        l = len(v)
        print('this person has {} images'.format(l))
        if l < num_sample:
            continue

        pers = []
        # print(k)
        # print(v)
        sample_idx=np.random.choice(l,size=num_sample,replace=False)

        # for i in range(l):
        for i in sample_idx:
            pers.append(build_crop(
                _seq_name, v[i]['im_path'], v[i]['gt'], crop_W, crop_H, v[i]['cams'],v[i]['id']))

            # for i,v in enumerate(pers):
            #   cv2.imwrite(osp.join(outdir, str(k)+'_'+str(i)+'.png'),v)

        res.append(np.array(pers))
    print("[*] Loaded {} persons from {} sequence.".format(len(res), _seq_name))
    print("Time used: {} seconds".format(time.time() - timepoint))

    return res
    #########################################

#     r = []
#     for idx, pers in enumerate(res):
#         for im in pers:
#             im = cv2.cvtColor(im, cv2.COLOR_BGR2RGB)
#             # im = Image.fromarray(im)
#             r.append([im, idx])
#         # print(idx,'dfdfd')


#     return r
    # self.data  format is [[idx,im],[idx,im]....]

    #########################################
    # print(np.shape(self.data[0]))

def build_crop(_seq_name, im_path, gt, crop_W, crop_H, cam,pid):
    # print(im_path)
    if im_path[-4:] != 'jpeg':
        print(im_path)
    im = cv2.imread(im_path)
    height, width, channels = im.shape
    # blobs, im_scales = _get_blobs(im)
    # im = blobs['data'][0]
    # gt = gt * im_scales[0]
    # clip to image boundary
    w = gt[2] - gt[0]
    h = gt[3] - gt[1]
    context = 0
    gt[0] = np.clip(gt[0] - context * w, 0, width - 1)
    gt[1] = np.clip(gt[1] - context * h, 0, height - 1)
    gt[2] = np.clip(gt[2] + context * w, 0, width - 1)
    gt[3] = np.clip(gt[3] + context * h, 0, height - 1)

    im = im[int(gt[1]):int(gt[3]), int(gt[0]):int(gt[2])]
    # print(im)

    im = cv2.resize(im, (int(crop_W),
                         int(crop_H)), interpolation=cv2.INTER_LINEAR)
    frame_id = im_path.split('/')[-1]
    # frame_id = frame_id.split('.')[0]

    return {'seq_name': _seq_name, 'frame_id': frame_id, 'img': im, 'cams': cam,'pid':pid}


if not os.path.isdir(download_path):
    print('please change the download_path')
if not os.path.isdir(label_path):
    print('please change the label_path')

# save_path = download_path + '/pytorch'
if not os.path.isdir(save_path):
    os.mkdir(save_path)

# _train_folders = os.listdir(os.path.join(download_path, 'train'))
# _test_folders = os.listdir(os.path.join(download_path, 'test'))
# seq_list = ['OV_underground_20_persons']
seq_list=[]
file_list = os.listdir(download_path)
for file in file_list:
    if file[:2] in ['SV','OV']:
        seq_list.append(file)
print(seq_list)

# seq_list = ['kk','ll']

train_save_path = save_path + '/train'
val_save_path = save_path + '/val'
query_save_path = save_path + '/query'
gallery_save_path = save_path + '/gallery'

if not os.path.isdir(train_save_path):
    os.mkdir(train_save_path)
    os.mkdir(val_save_path)
    os.mkdir(query_save_path)
    os.mkdir(gallery_save_path)

label_generator = 1
for seq_name in seq_list:
    data, gt = _sequence(seq_name, download_path, label_path, 'FRCNN17', 0.25)
    pers_clusters = build_samples(data, seq_name)
    num_pers = len(pers_clusters)
    _split = np.random.permutation(num_pers)
    test_split = _split[:int(num_pers / 5)]
    trainval_split = _split[int(num_pers / 5):]
    print(trainval_split.shape, '--', test_split.shape)

    for pers in trainval_split:
        # To check if each person has more than 4 image
        if len(pers_clusters[pers]) > min_frames:
            val_count = 0
            random.shuffle(pers_clusters[pers])
            for sample in pers_clusters[pers]:
                # print(len(pers_clusters[pers]))
                if val_count < val_num:  # first 2 images is used as val image
                    # dst_path = osp.join(val_save_path, str(label_generator)+'_'+str(sample['pid']))
                    dst_path = osp.join(val_save_path, str(sample['pid']))

                else:
                    # dst_path = osp.join(train_save_path, str(label_generator)+'_'+str(sample['pid']))
                    dst_path = osp.join(train_save_path, str(sample['pid']))


                if not os.path.isdir(dst_path):
                    os.mkdir(dst_path)
                    # first image is used as val image
                cv2.imwrite(osp.join(dst_path, '{}_{}_{}_{}'.format(
                    sample['seq_name'], sample['pid'],sample['cams'], sample['frame_id'])), sample['img'])
                val_count += 1
            label_generator += 1

    for pers in test_split:

        if len(pers_clusters[pers]) > min_frames:
            query_count = 0
            random.shuffle(pers_clusters[pers])

            for sample in pers_clusters[pers]:

                if query_count < query_num:  # first 2 images is used as val image
                    # dst_path = osp.join(query_save_path, str(label_generator)+'_'+str(sample['pid']))
                    dst_path = osp.join(query_save_path, str(sample['pid']))

                else:
                    # dst_path = osp.join(gallery_save_path,
                    #                     str(label_generator)+'_'+str(sample['pid']))
                    dst_path = osp.join(gallery_save_path, str(sample['pid']))

                if not os.path.isdir(dst_path):
                    os.mkdir(dst_path)
                cv2.imwrite(osp.join(dst_path, '{}_{}_{}_{}'.format(
                    sample['seq_name'], sample['pid'],sample['cams'], sample['frame_id'])), sample['img'])
                query_count += 1

            label_generator += 1