File size: 752 Bytes
a501a0c
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
import os
import shutil
import json

source_folder = '/mnt/petrelfs/zhuchenglin/diffusion/coco/images/train2017'
target_folder = '/mnt/petrelfs/zhuchenglin/diffusion/images_large'
anno_json_path = "/mnt/petrelfs/zhuchenglin/diffusion/coco/annotations/captions_train2017.json"

# Only the first `max_annotations` entries of the "annotations" list are used
# to decide which images get copied.
max_annotations = 200000


def unique_image_ids(annotations):
    """Return the distinct ``image_id`` values of *annotations*, first-seen order.

    A captions file may contain several annotation entries for the same
    image; de-duplicating here keeps each image from being copied (and
    counted) more than once.
    """
    # dict.fromkeys keeps insertion order, so the copy order matches the
    # order in which images first appear in the annotation list.
    return list(dict.fromkeys(entry["image_id"] for entry in annotations))


def copy_images(image_ids, src_dir, dst_dir):
    """Copy ``<image_id zero-padded to 12 digits>.jpg`` from *src_dir* to *dst_dir*.

    *dst_dir* is created if it does not exist. A progress line with the
    source path and a running 1-based counter is printed before each copy.

    Returns the number of files copied.
    Raises whatever ``shutil.copy`` raises (e.g. ``FileNotFoundError`` for a
    missing source image); the copy stops at the first failure.
    """
    # exist_ok avoids the check-then-create race of os.path.exists + makedirs.
    os.makedirs(dst_dir, exist_ok=True)

    count = 0
    for count, image_id in enumerate(image_ids, start=1):
        filename = f'{image_id:012}.jpg'
        source_path = os.path.join(src_dir, filename)
        target_path = os.path.join(dst_dir, filename)
        print(source_path, count)
        shutil.copy(source_path, target_path)
    return count


def main():
    """Copy the images referenced by the leading annotations to ``target_folder``."""
    with open(anno_json_path, 'r', encoding='utf-8') as f:
        annotation_data = json.load(f)
    annotations = annotation_data["annotations"][:max_annotations]
    copy_images(unique_image_ids(annotations), source_folder, target_folder)


if __name__ == "__main__":
    main()