#!/usr/bin/env python
# -*- coding: utf-8 -*-
"""Merge WordNet synset data with the WordNet-SALDO mapping and print it.

Three tab-separated, UTF-8 encoded files are read from the current
directory:

* ``wn3_synsets.txt``             -- columns 0, 2, 3 and 4 are used as
  synset id, gloss, part of speech and definition (column 1 is ignored).
* ``wordnet-saldo.txt``           -- columns 0, 1 and 2 are used as entry id,
  synset id and "core" value.
* ``wordnet-saldo-relations.txt`` -- columns 0, 1 and 2 are used as entry id
  and the two members of a relation tuple.

Every merged entry dict is printed on its own line.
"""

import codecs

SYNSETS_FILE = 'wn3_synsets.txt'
ENTRIES_FILE = 'wordnet-saldo.txt'
RELATIONS_FILE = 'wordnet-saldo-relations.txt'


def _split_fields(line):
    """Return the tab-separated fields of *line* without its line ending.

    Only trailing ``\\r``/``\\n`` characters are removed, so a final line
    that lacks a newline keeps its last character and CRLF files do not
    leave a stray ``\\r`` in the last field.
    """
    return line.rstrip('\r\n').split('\t')


def load_synsets(lines):
    """Build ``{synset_id: {"gloss", "pos", "definition"}}`` from *lines*.

    *lines* is any iterable of text lines. Blank lines are skipped. If an
    id occurs more than once, the last occurrence wins.

    Raises IndexError if a non-blank line has fewer than five fields.
    """
    synsets = {}
    for line in lines:
        fields = _split_fields(line)
        if fields == ['']:
            # Blank line (typically at end of file): nothing to parse.
            continue
        synsets[fields[0]] = {
            "gloss": fields[2],
            "pos": fields[3],
            "definition": fields[4],
        }
    return synsets


def load_entries(lines, synsets):
    """Build the entry table from *lines*, merging in the synset data.

    Each entry gets the keys ``"synset"`` and ``"core"`` plus a copy of
    every key of the referenced synset dict. Blank lines are skipped. If an
    entry id occurs more than once, the last occurrence wins.

    Raises IndexError if a non-blank line has fewer than three fields and
    KeyError if the referenced synset id is not present in *synsets*.
    """
    entries = {}
    for line in lines:
        fields = _split_fields(line)
        if fields == ['']:
            continue
        entry = {"synset": fields[1], "core": fields[2]}
        entry.update(synsets[fields[1]])
        entries[fields[0]] = entry
    return entries


def add_relations(lines, entries):
    """Append ``(field1, field2)`` tuples to ``entries[field0]["relations"]``.

    *entries* is modified in place; the ``"relations"`` list is created on
    first use, so entries without any relation never get that key. Blank
    lines are skipped.

    Raises IndexError if a non-blank line has fewer than three fields and
    KeyError if the entry id is not present in *entries*.
    """
    for line in lines:
        fields = _split_fields(line)
        if fields == ['']:
            continue
        relations = entries[fields[0]].setdefault("relations", [])
        relations.append((fields[1], fields[2]))


def main():
    """Read the three data files and print every merged entry."""
    with codecs.open(SYNSETS_FILE, encoding='utf-8') as f:
        synsets = load_synsets(f)

    with codecs.open(ENTRIES_FILE, encoding='utf-8') as f:
        entries = load_entries(f, synsets)

    with codecs.open(RELATIONS_FILE, encoding='utf-8') as f:
        add_relations(f, entries)

    for item in entries:
        # The parenthesised single-argument form prints identically under
        # Python 2 (print statement) and Python 3 (print function).
        print(entries[item])


if __name__ == "__main__":
    main()