File size: 595 Bytes
b031362
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
import json


def load_data(file_path='train.json',num_samples=2000):
    data = []
    with open(file_path, 'r', encoding='utf-8') as file:
        for line in file:
            try:
                data.append(json.loads(line))
            except json.JSONDecodeError as e:
                print(f"Error decoding JSON: {e}")
    return data[:num_samples]


if __name__ == '__main__':

    #数据集切分
    dataset = load_data()
    with open('train_2000.json', 'w', encoding='utf-8') as file:
        for item in dataset:
            file.write(json.dumps(item, ensure_ascii=False) + '\n')