"""Convert one HTML entry file into a DATE/BODY text record on stdout.

Usage: python <this script> ENTRY_FILE

NOTE(review): the reviewed copy of this script had lost its markup-related
regex literals and the statements that assigned ``date`` and ``body``, so
it could not run.  The tag-stripping pattern and the source of the date
used below are reconstructions -- confirm both against the entry files
this script is meant to process.
"""

import os
import re
import sys
import time

try:
    import htmlentitydefs  # Python 2 module name
except ImportError:  # Python 3 moved the same table to html.entities
    from html import entities as htmlentitydefs

# NOTE(review): the original tag pattern was lost; this removes every
# "<...>" span, which is the simplest reading of the surviving code.
TAG_RE = re.compile(r'<[^>]*>')

# Matches "&name;" plus the literal "&#39;" that the original handled
# separately.  NOTE(review): "&#39;" is inferred from the surviving
# replacement text "'" -- the pattern itself was garbled.
ENTITY_RE = re.compile(r'&(#39|[A-Za-z][A-Za-z0-9]*);')

# NOTE(review): the original date format is unknown; this one is a guess
# based on the DATE/BODY layout resembling a blog import format.
DATE_FORMAT = '%m/%d/%Y %I:%M:%S %p'


def strip_tags(text):
    """Return *text* with every ``<...>`` markup span removed."""
    return TAG_RE.sub('', text)


def decode_entities(text):
    """Return *text* with known HTML entities replaced, in a single pass.

    Each ``&name;`` found in ``htmlentitydefs.entitydefs`` is replaced by
    its table value and ``&#39;`` by an apostrophe.  Unknown entities are
    left untouched.  Because the text is scanned once, already-decoded
    output is never decoded again (``&amp;lt;`` becomes ``&lt;``, not
    ``<``), unlike one ``re.sub`` call per entity.
    """
    def _replace(match):
        name = match.group(1)
        if name == '#39':
            return "'"
        # A callable replacement is inserted verbatim, so entity values
        # are never interpreted as regex replacement templates.
        return htmlentitydefs.entitydefs.get(name, match.group(0))

    return ENTITY_RE.sub(_replace, text)


def format_entry(date, body):
    """Return the output record for *date* and *body*, without a final newline."""
    return '\n'.join([
        'DATE: %s' % (date,),
        '-----',
        'BODY:',
        body,
        '--------',
    ])


def main(argv):
    """Read the entry file named by ``argv[1]`` and print its record.

    Exits with a usage message when the file argument is missing.
    """
    if len(argv) < 2:
        sys.exit('usage: %s ENTRY_FILE' % argv[0])
    path = argv[1]

    # Context manager so the handle is closed even if reading fails.
    with open(path) as handle:
        entry = handle.read()

    # Strip markup before decoding so escaped text such as "&lt;b&gt;"
    # survives as literal "<b>" instead of being removed as a tag.
    body = decode_entities(strip_tags(entry))

    # NOTE(review): stand-in for the lost date extraction -- uses the
    # file's modification time; replace once the real source is known.
    date = time.strftime(DATE_FORMAT, time.localtime(os.path.getmtime(path)))

    print(format_entry(date, body))


if __name__ == '__main__':
    main(sys.argv)