"""Exploration of the trial data under the ``conll16st-*`` directories.

Loads the English and Chinese relation and parse files, then prints a few
sample entries.  Must be run from the directory that contains
``conll16st-en-01-12-16-trial``, ``conll16st-zh-01-08-2016-trial`` and
``output.json``.

Bare expressions such as ``example_relation`` are kept from the original
interactive session: they echo their value in a REPL/notebook and have no
visible effect when this file is run as a plain script.
"""
import json
import codecs
import subprocess


def _read_json_lines(path):
    """Return the JSON values stored one per line in the UTF-8 file *path*."""
    with codecs.open(path, encoding='utf8') as handle:
        # Whitespace-only lines (e.g. a trailing blank line) are skipped
        # instead of being handed to json.loads, which would raise on them.
        return [json.loads(line) for line in handle if line.strip()]


def _read_json(path):
    """Return the single JSON document stored in the UTF-8 file *path*."""
    with codecs.open(path, encoding='utf8') as handle:
        return json.load(handle)


# Plain-Python equivalent of the interactive `ls -l <dir>` command.
subprocess.call(['ls', '-l', 'conll16st-en-01-12-16-trial'])

# --- English relations -----------------------------------------------------
relations = _read_json_lines('conll16st-en-01-12-16-trial/relations.json')
example_relation = relations[10]
example_relation

# --- Chinese relations -----------------------------------------------------
chinese_relations = _read_json_lines(
    'conll16st-zh-01-08-2016-trial/relations.json')
chinese_relations[13]
print('Arg1 : %s\nArg2 : %s' % (chinese_relations[13]['Arg1']['RawText'],
                                chinese_relations[13]['Arg2']['RawText']))

# --- English parses --------------------------------------------------------
en_parse_dict = _read_json('conll16st-en-01-12-16-trial/parses.json')
en_example_relation = relations[10]
en_doc_id = en_example_relation['DocID']
print(en_parse_dict[en_doc_id]['sentences'][15]['parsetree'])

# --- Chinese parses --------------------------------------------------------
zh_parse_dict = _read_json('conll16st-zh-01-08-2016-trial/parses.json')
zh_example_relation = chinese_relations[13]
zh_doc_id = zh_example_relation['DocID']
print(zh_parse_dict[zh_doc_id]['sentences'][5]['parsetree'])

en_parse_dict[en_doc_id]['sentences'][15]['dependencies']
en_parse_dict[en_doc_id]['sentences'][15]['words'][0]
en_parse_dict[en_doc_id]['sentences'][15]['words'][1]

# --- Relations without senses ----------------------------------------------
# Read as UTF-8 like every other JSON file in this script.
relations_no_senses = _read_json_lines(
    'conll16st-en-01-12-16-trial/relations-no-senses.json')
relations_no_senses[10]

# --- Token -> relation links -----------------------------------------------
# Flatten every sentence's word list into one document-level token list.
all_tokens = [token
              for sentence in en_parse_dict[en_doc_id]['sentences']
              for token in sentence['words']]
for token in all_tokens[0:20]:
    # token[0] is printed as the token text; token[1] is a dict that holds
    # the 'Linkers' list.  Each linker is split on '_' into (role, id).
    for linker in token[1]['Linkers']:
        role, relation_id = linker.split('_')
        print('%s \t is part of %s in relation id %s'
              % (token[0], role, relation_id))

print('Relation ID is %s' % relations[13]['ID'])
print('Arg 1 : %s' % relations[13]['Arg1']['RawText'])

# --- CoNLL-format file: first 40 characters of the first five lines --------
with open('conll16st-en-01-12-16-trial/conll_format/wsj_1000.conll') as conll_file:
    first_lines = conll_file.readlines()[0:5]
for x in first_lines:
    print(x[0:40])

# --- System output ---------------------------------------------------------
output_relations = _read_json_lines('output.json')
output_relations[10]