在做項目時,需要從數據集裡面挑出若干張圖片來做標記。作為程序員,為了避免手動一張一張地篩選,我寫了下面這個 Python 腳本:它讀取 img.txt 中列出的圖片名稱,並把對應的圖片從數據集文件夾複製到標記文件夾。
Python腳本如下:
"""Copy the images named in a list file from a data-set folder to a label folder.

The list file holds one image name (or path) per line.  Each entry is reduced
to a short ID (its last ``ID_LENGTH`` characters, ignoring a ``.jpg`` suffix)
and every file in the source folder whose base name equals one of those IDs is
copied to the target folder.
"""
import csv
import os
import shutil

# Default list file: one image name (or path) per line.
filename = 'img.txt'

# Folder holding the complete image set, and the folder that receives the picks.
SOURCE_DIR = r"C:\Users\Administrator.PC-201708272051\Desktop\項目組\text_detect_label_data\China_SameBrowser"
TARGET_DIR = r"C:/Users/Administrator.PC-201708272051/Desktop/labeldata/"

# Number of trailing characters of a listed name that identify an image.
ID_LENGTH = 4


def readImageName(list_file=None):
    """Return the image IDs found in *list_file*.

    Args:
        list_file: Path of the text file to read.  Defaults to the module-level
            ``filename`` (looked up at call time).

    Returns:
        A list with one ID per non-blank line, in file order: the last
        ``ID_LENGTH`` characters of the line after surrounding whitespace and
        a trailing ``.jpg`` (any letter case) have been removed.

    Raises:
        OSError: If the list file cannot be opened.
    """
    if list_file is None:
        list_file = filename

    imgnames = []
    with open(list_file) as f:
        for line in f:
            name = line.strip()
            # Remove the extension as a suffix.  str.strip(".jpg") would treat
            # the argument as a character set and also eat leading/trailing
            # 'j', 'p', 'g' and '.' characters that belong to the name.
            if name.lower().endswith(".jpg"):
                name = name[:-len(".jpg")]
            # Blank lines must not produce an empty ID that could match files.
            if name:
                imgnames.append(name[-ID_LENGTH:])
    print(imgnames)
    return imgnames


def pickImg(source_dir=SOURCE_DIR, target_dir=TARGET_DIR, list_file=None):
    """Copy every listed image from *source_dir* into *target_dir*.

    Args:
        source_dir: Folder that is scanned for images.
        target_dir: Folder that receives the copies; created if missing.
        list_file: Passed through to ``readImageName``.

    Raises:
        OSError: If the list file or source folder cannot be read, or a copy
            fails.
    """
    # A set gives constant-time membership tests while scanning the folder.
    wanted = set(readImageName(list_file))
    os.makedirs(target_dir, exist_ok=True)

    # Walk every entry of the image set and copy the ones that were listed.
    for image in os.listdir(source_dir):
        oldname = os.path.join(source_dir, image)
        stem = os.path.splitext(image)[0]
        # Skip sub-directories: shutil.copyfile only handles regular files.
        if stem in wanted and os.path.isfile(oldname):
            newname = os.path.join(target_dir, image)
            shutil.copyfile(oldname, newname)


if __name__ == "__main__":
    pickImg()