convert.py 336 字节
Newer Older
X
xixiaoyao 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18
# coding: utf-8
import json

# Convert the raw combined training file into a JSON Lines file: every entry
# of the top-level 'data' list becomes one line holding that entry's context
# and its question/answer list.
INPUT_PATH = 'mrqa-combined.train.raw.json'
OUTPUT_PATH = 'train.json'

# Read in binary mode so json detects the file's Unicode encoding itself
# instead of depending on the platform's default text encoding. The whole
# input is loaded (and the handle closed) before the output is opened, so a
# missing or malformed input never truncates an existing output file.
with open(INPUT_PATH, 'rb') as reader:
    entries = json.load(reader)['data']

# The context manager guarantees the output is flushed and closed even when
# a malformed entry aborts the loop part-way through.
with open(OUTPUT_PATH, 'w') as writer:
    for index, entry in enumerate(entries):
        paragraphs = entry['paragraphs']
        # Each entry must carry exactly one paragraph; anything else would
        # silently lose data, so fail loudly (and do so even under `-O`,
        # where a plain assert would be skipped).
        if len(paragraphs) != 1:
            raise ValueError(
                'entry %d has %d paragraphs, expected exactly 1'
                % (index, len(paragraphs))
            )
        paragraph = paragraphs[0]
        record = {
            'context': paragraph['context'],
            'qa_list': paragraph['qas'],
        }
        # json.dumps escapes non-ASCII characters by default, so the output
        # is plain ASCII regardless of the text-mode encoding.
        writer.write(json.dumps(record) + '\n')