# Load the whole novel into memory. The 'utf-8-sig' codec decodes UTF-8 and
# drops a leading byte-order mark if the file starts with one.
with open('frankenstein.txt', 'r', encoding='utf-8-sig') as f:
    text = f.read()

# Splitting on runs of whitespace gives the list of raw tokens ("words").
words = text.split()

# Tally how many times each distinct token occurs.
word_count_dict = {}
for word in words:
    # .get() supplies 0 the first time a token is seen, so a single statement
    # handles both the "new word" and the "seen before" cases.
    word_count_dict[word] = word_count_dict.get(word, 0) + 1

def word_count_key(word):
    """Return the count stored for `word`, for use as a sort key.

    The count is read from the module-level `word_count_dict`; a word that is
    not a key of that dictionary raises KeyError.
    """
    occurrences = word_count_dict[word]
    return occurrences

# Order the distinct words from most to least frequent. The sort is stable,
# so words with equal counts keep the order in which the dictionary holds them.
sorted_words = list(word_count_dict)
sorted_words.sort(key=word_count_key, reverse=True)

# Report the ten most frequent words alongside their counts.
top_ten = sorted_words[:10]
for word in top_ten:
    print(word, word_count_dict[word])

the 4263
and 2966
of 2902
I 2794
to 2234
my 1680
a 1447
in 1175
was 1030
that 1012

# Look up three capitalisations of the same word; each one is a separate key
# in word_count_dict, so each has its own count.
report = 'The word "{}" appears {} times in Frankenstein.'
for word in ['for', 'For', 'FOR']:
    count = word_count_dict[word]
    print(report.format(word, count))

The word "for" appears 500 times in Frankenstein.
The word "For" appears 23 times in Frankenstein.
The word "FOR" appears 3 times in Frankenstein.

# Re-tokenise the text on whitespace.
words = text.split()

# Count again, this time folding every token to lowercase first so that
# differently capitalised spellings share a single dictionary key.
word_count_dict = {}
for word in words:
    lowercase_word = word.lower()
    # .get() returns 0 for a key that has not been stored yet.
    word_count_dict[lowercase_word] = word_count_dict.get(lowercase_word, 0) + 1

# Combined count for every capitalisation of "for".
word_count_dict['for']

526

# Tokens that differ only by attached punctuation are still separate keys:
# compare the bare word with the same word followed by a comma.
report = 'The word "{}" appears {} times in Frankenstein.'
for word in ['study', 'study,']:
    count = word_count_dict[word]
    print(report.format(word, count))

The word "study" appears 13 times in Frankenstein.
The word "study," appears 5 times in Frankenstein.

# A sample sentence containing several punctuation marks.
s = "This is a string, it contains some punctuation. Here's some more: !?.,"

# Print the original, then a copy with every comma removed.
# str.replace returns a new string; s itself is left unchanged.
print(s, s.replace(',', ''), sep='\n')

# Print the integer code that ord() reports for each character of the string.
for c in "This is MTH 337":
    code = ord(c)
    print("'{}'  ->  {}".format(c, code))

'T'  ->  84
'h'  ->  104
'i'  ->  105
's'  ->  115
' '  ->  32
'i'  ->  105
's'  ->  115
' '  ->  32
'M'  ->  77
'T'  ->  84
'H'  ->  72
' '  ->  32
'3'  ->  51
'3'  ->  51
'7'  ->  55

# Integer character codes to turn back into text.
codes = [104, 101, 108, 108, 111]

# chr() is the inverse of ord(): it maps each integer code to its character.
char_list = [chr(n) for n in codes]

# Join the individual characters into a single string.
txt = ''.join(char_list)
print(txt)

hello

# The example message and the key string used alongside it.
message, key = 'Top secret!', 'buffalo'

# List the integer code of every character in the message.
for c in message:
    code = ord(c)
    print("'{}'  ->  {}".format(c, code))

'T'  ->  84
'o'  ->  111
'p'  ->  112
' '  ->  32
's'  ->  115
'e'  ->  101
'c'  ->  99
'r'  ->  114
'e'  ->  101
't'  ->  116
'!'  ->  33

# List the integer code of every character in the key.
for c in key:
    code = ord(c)
    print("'{}'  ->  {}".format(c, code))

'b'  ->  98
'u'  ->  117
'f'  ->  102
'f'  ->  102
'a'  ->  97
'l'  ->  108
'o'  ->  111

# Add the code of the first message character ('T' -> 84) to the code of the
# first key character ('b' -> 98); "% 128" wraps the sum back into 0..127.
(ord('T') + ord('b')) % 128

54

# Work at the top-left corner position.
i = j = 0

# The window centred on (i, j) would be the slice below, but at i = j = 0 its
# start index is -1, which Python reads as "last element", not "one before
# the first". It is left commented out, and the window that starts at (i, j)
# is taken instead.
# NOTE(review): noisy_img is presumably a 2-D NumPy array defined in an
# earlier cell - confirm.
#grid = noisy_img[i-1:i+2, j-1:j+2]
grid = noisy_img[i:i + 2, j:j + 2]

def get_padded_img(img, pad):
    """Return a copy of `img` surrounded by a border of 0.5-valued pixels.

    Parameters
    ----------
    img : 2-D array
        Image to pad; `img.shape` must unpack into (rows, columns).
    pad : int
        Width of the border added on every side. Must be non-negative;
        0 returns an unpadded float copy of `img`.

    Returns
    -------
    numpy.ndarray
        Float array of shape (rows + 2*pad, columns + 2*pad) whose interior
        holds `img` and whose border is filled with 0.5.

    Raises
    ------
    ValueError
        If `pad` is negative.
    """
    if pad < 0:
        raise ValueError("pad must be non-negative, got {}".format(pad))

    nrows, ncols = img.shape

    # Start from a canvas filled with 0.5 that is large enough for the image
    # plus the border on all four sides.
    padded_img = np.full((nrows + 2*pad, ncols + 2*pad), 0.5)

    # Address the interior by explicit end positions. The shorter `pad:-pad`
    # breaks for pad == 0, because `0:-0` is the empty slice `0:0`.
    padded_img[pad:pad + nrows, pad:pad + ncols] = img

    return padded_img

Wednesday, November 5th, 2025

Pre-processing text for analysis

Project 5 - Code breakers

Background: ASCII codes

Text encryption

Image denoising thoughts

Wednesday, November 5th, 2025

Pre-processing text for analysis

Project 5 - Code breakers

Background: ASCII codes

Text encryption

Image denoising thoughts

Project 5 - Code breakers