视频教程 所用到的数据集在视频的简介里:数据集-hymenoptera_data-train
或者在官网下载数据集
用到的一些python的基础知识
conda install opencv-python pip install opencv-python img = Image.open(img_path) # 打开图片 img.show() # 展示图片 root_dir = "dataset/train" label_dir = "ants" # 连接两个字符串 path = os.path.join(root_dir, label_dir)
from torch.utils.data import Dataset
from PIL import Image
import os
class MyData(Dataset):
def __init__(self, root_dir, label_dir):
self.root_dir = root_dir
self.label_dir = label_dir
self.path = os.path.join(self.root_dir, self.label_dir)
self.img_path = os.listdir(self.path) # 打开存储图片的文件夹
# 返回训练样本
def __getitem__(self, idx):
img_name = self.img_path[idx]
img_item_path = os.path.join(self.root_dir, self.label_dir, img_name)
img = Image.open(img_item_path)
label = self.label_dir
return img, label
def __len__(self):
return len(self.img_path)
if __name__=='__main__':
root_dir = "dataset/train"
ants_label_dir = "ants"
bees_label_dir = "bees"
ants_dataset = MyData(root_dir=root_dir, label_dir=ants_label_dir)
bees_dataset = MyData(root_dir, bees_label_dir)
print(len(ants_dataset))
train_dataset = ants_dataset + bees_dataset
print(len(train_dataset))
import os
root_dir = "dataset/train"
target_dir = "ants_image"
img_path = os.listdir(os.path.join(root_dir, target_dir))
label = target_dir.split('_')[0]
out_dir = "ants_label"
for i in img_path:
file_name = i.split('.jpg')[0]
with open(os.path.join(root_dir, out_dir, "{}.txt".format(file_name)), 'w')as f:
f.write(label)



