"""Count how often each character occurs in a text file and pretty-print the tally.

Run as a script. With no arguments it reads the default genome FASTA path
below; an optional first command-line argument overrides that path.
"""
import pprint
import sys
from collections import Counter

# Path read when no command-line argument is supplied.
DEFAULT_PATH = '/u1/junk/kinne/GRCh38.p12.genome.fa'


def count_characters(lines):
    """Return a dict mapping each character to its number of occurrences.

    Args:
        lines: An iterable of strings (for example an open text file, which
            yields one line at a time). Every character of every string is
            counted, including newline characters.

    Returns:
        A plain ``dict`` of ``{character: count}``; empty when *lines*
        yields nothing.
    """
    tally = Counter()
    for line in lines:
        # Counter.update iterates the string in C, avoiding a Python-level
        # loop over every character of a very large file.
        tally.update(line)
    # Convert to a plain dict so pprint renders it as a dict, not Counter(...).
    return dict(tally)


def main(path=DEFAULT_PATH):
    """Count the characters of the file at *path* and pretty-print the result.

    Args:
        path: File to read; opened in text mode with the platform default
            encoding.

    Raises:
        OSError: If the file cannot be opened or read.
    """
    # The context manager closes the file even if reading raises.
    with open(path, 'r') as f:
        count = count_characters(f)
    pprint.pprint(count)


if __name__ == '__main__':
    main(sys.argv[1] if len(sys.argv) > 1 else DEFAULT_PATH)