#!/usr/bin/env python
# -*- coding: utf-8 -*-
"""Extract the second column of a tab-separated word-pair file.

Reads ``corpora/en2el.txt`` (UTF-8, one ``first<TAB>second`` pair per line;
the original script names the columns ``en`` and ``el``), prints every
second-column word, writes those words newline-joined to ``/tmp/greek.txt``
and finally prints the sorted set of characters they contain.
"""
from codecs import open

# Default locations used when the script is run directly.
SOURCE_PATH = 'corpora/en2el.txt'
OUTPUT_PATH = '/tmp/greek.txt'


def main(source_path=SOURCE_PATH, output_path=OUTPUT_PATH):
    """Print and save the second-column words, then print their alphabet.

    Args:
        source_path: UTF-8 text file with one tab-separated pair per line.
        output_path: Destination file; receives the words joined by newlines
            (no trailing newline), encoded as UTF-8.

    Raises:
        ValueError: If a non-blank line does not split into exactly two
            tab-separated fields after stripping surrounding whitespace.
    """
    # The context manager guarantees the handle is closed even on error.
    with open(source_path, encoding='utf-8', mode='r') as source:
        lines = source.readlines()

    # Blank lines carry no pair, so skip them instead of failing to unpack.
    en2el = [pair.strip().split('\t') for pair in lines if pair.strip()]
    greek = [el for en, el in en2el]

    # Single-argument print(...) behaves the same on Python 2 and Python 3.
    for word in greek:
        print(word)

    letters = set(''.join(greek))

    # Closing the output file flushes the data deterministically.
    with open(output_path, encoding='utf-8', mode='w') as out:
        out.write('\n'.join(greek))

    print(' '.join(sorted(letters)))


if __name__ == '__main__':
    main()