import json | |
from tqdm import tqdm | |
import argparse | |
def save_data(data, file_path):
    """Write *data* to *file_path* in JSON Lines format.

    Each item of *data* is serialized with ``json.dumps`` and written on its
    own line, terminated by a newline. The file is opened in write mode, so
    any existing content is replaced.

    Args:
        data: Iterable of JSON-serializable objects, one per output line.
        file_path: Destination path; written as UTF-8.

    Raises:
        OSError: If the file cannot be opened for writing.
        TypeError: If an item is not JSON-serializable.
    """
    with open(file_path, 'w', encoding='utf8') as f:
        # ensure_ascii=False keeps non-ASCII text (e.g. Chinese) readable in
        # the output instead of emitting \uXXXX escapes.
        f.writelines(
            json.dumps(record, ensure_ascii=False) + '\n' for record in data
        )
def submit(file_path):
    """Convert a JSON Lines prediction file into submission records.

    Every non-blank line of *file_path* is parsed as a JSON object. The
    category name is looked up as ``record['choice'][record['label']]`` and
    translated to its code string through the table below.

    Args:
        file_path: Path to a UTF-8 JSON Lines file whose records carry the
            keys ``id``, ``choice`` and ``label``.

    Returns:
        A list of ``{'id': ..., 'label': <code string>}`` dicts, in input
        order.

    Raises:
        KeyError: If a record lacks a required key, or its category name is
            not in the table.
        json.JSONDecodeError: If a non-blank line is not valid JSON.
    """
    # Category name -> code string expected in the submission file.
    label_to_id = {
        "故事": "100",
        "文化": "101",
        "娱乐": "102",
        "体育": "103",
        "财经": "104",
        "房产": "106",
        "汽车": "107",
        "教育": "108",
        "科技": "109",
        "军事": "110",
        "旅游": "112",
        "国际": "113",
        "股票": "114",
        "农业": "115",
        "电竞": "116",
    }
    with open(file_path, 'r', encoding='utf8') as f:
        # Drop blank lines (e.g. a trailing empty line) up front: json.loads
        # would otherwise raise on them, and materializing the list lets the
        # progress bar show an accurate total.
        lines = [line for line in f if line.strip()]

    result = []
    for line in tqdm(lines):
        data = json.loads(line)
        # NOTE(review): 'label' is used as an index/key into 'choice';
        # presumably 'choice' is the candidate list and 'label' the predicted
        # position - confirm against the producer of this file.
        category = data['choice'][data['label']]
        result.append({'id': data['id'], 'label': label_to_id[category]})
    return result
if __name__ == "__main__":
    # Command-line entry point: read predictions from --data_path, convert
    # them with submit(), and write the result to --save_path.
    parser = argparse.ArgumentParser(
        description="Convert prediction records into submission format",
    )
    # Both paths are required: an empty default could only fail later with an
    # unhelpful error from open("").
    parser.add_argument(
        "--data_path",
        type=str,
        required=True,
        help="input JSON Lines file with prediction records",
    )
    parser.add_argument(
        "--save_path",
        type=str,
        required=True,
        help="output JSON Lines file for the submission records",
    )
    args = parser.parse_args()
    save_data(submit(args.data_path), args.save_path)