File size: 955 Bytes
625a17f
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
import json
import random

# Draw a small random subset of the records stored in one JSON file and write
# that subset to a second JSON file.

# Alternative input that was used previously:
# json_path = "/data/work-gcp-europe-west4-a/yuqian_fu/Ego/data_segswap/egoexo_val_framelevel_all.json"
json_path = "/data/work-gcp-europe-west4-a/yuqian_fu/datasets/HANDAL/handal_dataset_mugs/handal_train.json"
output_path = "/data/work-gcp-europe-west4-a/yuqian_fu/datasets/HANDAL/handal_dataset_mugs/handal_test100.json"

# Upper bound on the number of records written to output_path.
sample_size = 100

# Seeding is intentionally left disabled, so every run draws a different
# subset. Uncomment the next line to make the selection reproducible.
# random.seed(42)

# Load the original, complete data. JSON text is UTF-8, so decode it explicitly
# instead of relying on the platform's default encoding.
with open(json_path, 'r', encoding='utf-8') as f:
    data_full = json.load(f)

# Selection strategies that were tried earlier and are kept here for reference:
#   random.sample(data_full, len(data_full) // 3)   # a random third of the data
#   data_full[:100]                                  # the first 100 records, in order

# random.sample() raises ValueError when asked for more items than the
# population holds, so clamp the request to the number of available records.
# NOTE(review): assumes the top-level JSON value is a list -- confirm against
# the input file.
data_smallsize = random.sample(data_full, min(sample_size, len(data_full)))

# Save the reduced data to the new JSON file.
with open(output_path, 'w', encoding='utf-8') as f:
    json.dump(data_smallsize, f)

# The trailing label is a fixed string, not the destination path; the file
# actually written is output_path.
print(f'Saved {len(data_smallsize)} samples to smallsize_version')