# Read the whole corpus into memory as one string.
with open('../../resources/data/input.txt', 'r', encoding='utf-8') as f:
    text = f.read()

# get used chars
# Distinct characters of the corpus, sorted by code point; their count is the
# vocabulary size.
chars = sorted(set(text))
vocab_size = len(chars)
print("characters used by shakespear: " + ''.join(chars))
print(f"this corresponds to: {vocab_size} characters")

# Output recorded from a previous run (kept as a comment so the file parses).
# Only 63 of the 65 characters are visible below; the other two are presumably
# a newline and a space, which sort before '!' and would explain the line
# break after the colon -- TODO confirm against the input file.
#
#   characters used by shakespear:
#    !$&',-.3:;?ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz
#   this corresponds to: 65 characters