# coding: utf-8
"""Helpers to load a text file as a string of lowercase ASCII letters and count them."""
from re import sub

from unidecode import unidecode


def readFile(filename):
    """Return the contents of *filename* reduced to the letters ``a``-``z``.

    The file is decoded as UTF-8, transliterated to ASCII with
    ``unidecode``, lowercased, and every character outside ``a-z``
    (digits, punctuation, whitespace, newlines) is removed.

    Args:
        filename: Path of the text file to read.

    Returns:
        A single ``str`` containing only the characters ``a``-``z``.

    Raises:
        OSError: If the file cannot be opened.
        UnicodeDecodeError: If the file is not valid UTF-8.
    """
    # Decode explicitly so the result does not depend on the platform's
    # default locale encoding.
    with open(filename, 'r', encoding='utf-8') as f:
        raw = f.read()

    # unidecode's optional second argument is an error-handling mode, not an
    # encoding, so it is left at its default here.
    # Lowercase *after* transliterating: some characters transliterate to
    # capital letters, which the a-z filter below would otherwise discard.
    ascii_text = unidecode(raw).lower()

    # One pass over the whole text instead of per-line string concatenation.
    return sub(r'[^a-z]', '', ascii_text)


def countLetters(text):
    """Return the number of items in *text* (its length for a string).

    Every element is counted; no filtering is applied, so callers that
    want a letter count should pass already-filtered text.

    Args:
        text: A string, or any iterable of characters.

    Returns:
        The number of elements as an ``int``.
    """
    try:
        return len(text)
    except TypeError:
        # Un-sized iterables (e.g. generators) have no len(); count by
        # iterating so they keep working.
        return sum(1 for _ in text)