X-Git-Url: https://git.njae.me.uk/?a=blobdiff_plain;f=cipher.py;h=c5cd6060e208dff51eb7a1cec59649558844a62a;hb=a786efb8159cc271731dbd10ac3cf360e5236b5f;hp=446a2711bab1aeaa4b6eef951e3f08c85e0f35c8;hpb=bac232510706cdfd94d10de93d41fe9ea12f8034;p=cipher-tools.git

diff --git a/cipher.py b/cipher.py
index 446a271..c5cd606 100644
--- a/cipher.py
+++ b/cipher.py
@@ -5,6 +5,7 @@ import logging
 import math
 from itertools import zip_longest
 from segment import segment
+from multiprocessing import Pool
 
 # To time a run:
 #
@@ -428,6 +429,53 @@ def keyword_break(message, wordlist=keywords, metric=norms.euclidean_distance, t
     logger.info('Keyword break best fit with key {0} (wrap={1}) gives fit of {2} and decrypt starting: {3}'.format(best_keyword, best_wrap_alphabet, best_fit, sanitise(keyword_decipher(message, best_keyword))[:50]))
     return (best_keyword, best_wrap_alphabet), best_fit
 
+def keyword_break_mp(message, wordlist=keywords,
+                     metric=norms.euclidean_distance,
+                     target_counts=normalised_english_counts,
+                     message_frequency_scaling=norms.normalise,
+                     chunksize=500):
+    """Breaks a keyword substitution cipher using a dictionary and
+    frequency analysis, scoring the candidate keys in parallel
+
+    Every word in wordlist is tried with each wrap_alphabet value 0, 1
+    and 2. The candidates are scored by keyword_break_one in a
+    multiprocessing Pool, passed to the workers in chunks of chunksize.
+    Returns ((keyword, wrap_alphabet), fit) for the candidate with the
+    smallest fit. An empty wordlist leaves nothing to compare, so min()
+    raises ValueError.
+
+    >>> keyword_break_mp(keyword_encipher('this is a test message for the keyword decipherment', 'elephant', 1), wordlist=['cat', 'elephant', 'kangaroo']) # doctest: +ELLIPSIS
+    (('elephant', 1), 0.41643991598441...)
+    """
+    helper_args = [(message, word, wrap, metric, target_counts,
+                    message_frequency_scaling)
+                   for word in wordlist for wrap in range(3)]
+    with Pool() as pool:
+        breaks = pool.starmap(keyword_break_one, helper_args, chunksize)
+    return min(breaks, key=lambda k: k[1])
+
+def keyword_break_one(message, keyword, wrap_alphabet, metric, target_counts,
+                      message_frequency_scaling):
+    """Scores a single candidate key on behalf of keyword_break_mp
+
+    Deciphers message with keyword and wrap_alphabet, scales the letter
+    frequencies of the result with message_frequency_scaling and compares
+    them with target_counts using metric.
+    Returns ((keyword, wrap_alphabet), fit).
+
+    This stays a module-level function because keyword_break_mp passes it
+    to Pool.starmap, which pickles the function for the worker processes.
+    """
+    plaintext = keyword_decipher(message, keyword, wrap_alphabet)
+    counts = message_frequency_scaling(letter_frequencies(plaintext))
+    fit = metric(target_counts, counts)
+    # Runs once per candidate key: only build the message (and sanitise
+    # the plaintext) when debug output is switched on.
+    if logger.isEnabledFor(logging.DEBUG):
+        logger.debug('Keyword break attempt using key {0} (wrap={1}) gives fit of {2} and decrypt starting: {3}'.format(keyword, wrap_alphabet, fit, sanitise(plaintext)[:50]))
+    return (keyword, wrap_alphabet), fit
+
+
 def scytale_break(message, metric=norms.euclidean_distance, target_counts=normalised_english_bigram_counts, message_frequency_scaling=norms.normalise):
     """Breaks a Scytale cipher
 