YuqianFu's picture
Upload folder using huggingface_hub
625a17f verified
import json
import random
# Alternative input used for an earlier run (egoexo validation split):
# json_path = "/data/work-gcp-europe-west4-a/yuqian_fu/Ego/data_segswap/egoexo_val_framelevel_all.json"
json_path = "/data/work-gcp-europe-west4-a/yuqian_fu/datasets/HANDAL/handal_dataset_mugs/handal_train.json"
output_path = "/data/work-gcp-europe-west4-a/yuqian_fu/datasets/HANDAL/handal_dataset_mugs/handal_test100.json"

# Number of entries drawn from the full annotation list.
NUM_SAMPLES = 100


def subsample_json(src_path, dst_path, num_samples=NUM_SAMPLES, seed=None):
    """Write a random subset of a JSON list to a new JSON file.

    Args:
        src_path: Path of the JSON file holding the full list of entries.
        dst_path: Path the reduced list is written to (overwritten if present).
        num_samples: How many entries to draw without replacement. When the
            input holds fewer entries, all of them are kept (in random order)
            instead of failing.
        seed: Optional seed for a reproducible draw. ``None`` (the default)
            gives a different subset on every run.

    Returns:
        The list of sampled entries, exactly as written to ``dst_path``.

    Raises:
        TypeError: If the top-level JSON value is not a list.
        ValueError: If ``num_samples`` is negative.
    """
    # Read the original, complete data.
    with open(src_path, "r", encoding="utf-8") as f:
        data_full = json.load(f)

    if not isinstance(data_full, list):
        raise TypeError(
            f"Expected a JSON list in {src_path}, got {type(data_full).__name__}"
        )

    # random.sample raises ValueError when asked for more items than exist,
    # so clamp the request to the population size.
    sample_size = min(num_samples, len(data_full))
    # A private generator keeps the draw independent of global random state.
    rng = random.Random(seed)
    data_smallsize = rng.sample(data_full, sample_size)

    # Save the reduced data to the new JSON file.
    with open(dst_path, "w", encoding="utf-8") as f:
        json.dump(data_smallsize, f)

    return data_smallsize


if __name__ == "__main__":
    # Earlier variants kept the first 100 entries or a random third of the
    # data; the current version draws NUM_SAMPLES entries uniformly at random.
    data_smallsize = subsample_json(json_path, output_path, NUM_SAMPLES)
    print(f"Saved {len(data_smallsize)} samples to {output_path}")