RubyGems - substitution_solver - Versions diffs - 0.5.0 → 0.5.1 - Mend

substitution_solver 0.5.0 → 0.5.1

Files changed (4) hide show

data/dictionary_builder.rb CHANGED Viewed

@@ -1,4 +1,17 @@
 #!/usr/bin/env ruby
+# This program basically is responsible for building a new english.dic file from
+# a source ascii text file.  Feeding it a novel is probably the best idea.  You
+# want the text to be plain english, the more of it the better.
+# the format of this command is
+#  ruby dictionary_builder.rb <ascii_filename>
+require 'optparse'
+require 'rdoc/usage'
+opts = OptionParser.new
+opts.on("-h", "--help") {RDoc::usage}
+opts.parse(ARGV)
 hash = Hash.new(0)

data/dictionary_inspector.rb CHANGED Viewed

@@ -1,4 +1,19 @@
 #!/usr/bin/env ruby
+# This program lets you examine the contents of an english.dic file.
+# The file is a binary file that is in ruby's marshal format.
+# The usage of this command is
+#  ruby dictionary_inspector.rb
+#
+# you don't need to supply a filename, it assumes that english.dic is in the
+# current directory.
+require 'optparse'
+require 'rdoc/usage'
+opts = OptionParser.new
+opts.on("-h", "--help") {RDoc::usage}
+opts.parse(ARGV)
 $dictionary = Hash.new(0)                                           # The dictionary of tetragraph frequencies

data/substitution_solver.rb CHANGED Viewed

@@ -1,24 +1,37 @@
 #!/usr/bin/env ruby
+# This program is for solving simple substitution ciphers such as the
+# cryptoquotes found in the newspaper.  The usage of the command is as follows
+#  ruby substitution_solver.rb <filename>
+#
+# where <filename> is the name of an ascii text file that contains the
+# ciphertext that you would like to retrieve the plaintext of
+#
+# this command requires that english.dic be in the current working directory in
+# order to function properly.
+#
+# also be aware that this program will never return, it has no way of knowing
+# when it has achieved the correct answer, so you must hit CTRL-C to exit the
+# program
-$iteration = 0                                                      # To record how many iterations the programs
-                                                                    #  had to churn through
+require 'optparse'
+require 'rdoc/usage'
-ciphertext = String.new
+opts = OptionParser.new
+opts.on("-h", "--help") {RDoc::usage}
-File::readlines(ARGV[0]).each do |line|                             # Grab the input from the standard input
-    ciphertext << line
-end
+opts.parse(ARGV)
-ciphertext.gsub!(/[^a-zA-Z]/, "").upcase!                           # get rid of any non-alphabetic characters
+$iteration = 0                                                      # To record how many iterations the programs
+                                                                    #  had to churn through
-key = Hash.new                                                      # Create a hash that will represent the translation key
-$dictionary = Hash.new(0)                                           # The dictionary of tetragraph frequencies
-File.open("english.dic") do |f|                                     # Open the saved tetragraph information
-    $dictionary = Marshal.load(f)                                   # And load this information into our dictionary
-end
-def score(string)                                                   # This function will score a string against the tetragraph statistics
+# this function is responsible for scoring a string against the tetragraph
+# statistics
+#  Parameters:
+# * string = the string that you want to score
+#  Return Value:
+# * A number representing the score, the higher the score, the better (ie more
+#   likely to be english)
+def score(string)
     $iteration += 1                                                 # Increment the iteration count as this is probably the most fundamental loop to the program
     tally = 0                                                       # Set a counter to 0
     0.upto(string.length-4) do |x|                                  # Iterate through the string
@@ -27,7 +40,14 @@ def score(string)                                                   # This funct
     return tally                                                    # and return our grand total when we're finished adding it all up
 end
-def small_adj!(key)                                                 # this function makes small random adjustments to the key when we've hill climbed our way into a dead end
+# this function makes small random adjustments to the key when we've hill
+# climbed our way into a dead end
+#  Parameters:
+# * key = A hash that represents the current translation mapping from ciphertext
+#   to plaintext
+#  Return Value:
+# * none
+def small_adj!(key)
     for i in 0...rand(5)                                            # pick a random number of changes to make
         j = rand(26)                                                # now pick two random letters in the alphabet to swap
         k = rand(26)
@@ -38,8 +58,16 @@ def small_adj!(key)                                                 # this funct
         end
     end
 end
-def plaintext(ciphertext, key)                                      # This function will return the decoded ciphertext using a given key to do the decoding
+# This function will return the decoded ciphertext using a given key to do the
+# decoding
+#  Parameters:
+# * ciphertext = A string that represents the ciphertext
+# * key = A hash that represents how to translate the ciphertext into
+#   plaintext
+#  Return Value:
+# * Returns the deciphered plaintext according to the key that was supplied.
+def plaintext(ciphertext, key)
     return_string = String.new                                      # create a return string
     for x in 0...ciphertext.length                                  # loop through the ciphertext
@@ -47,8 +75,13 @@ def plaintext(ciphertext, key)                                      # This funct
     end
     return return_string                                            # return the answer
 end
-def randomize!(key)                                                 # completely randomize the key, ie start over from scratch
+# completely randomize the key, ie start over from scratch
+#   Parameters:
+#       key = key as a Hash that needs to be randomized
+#   Return Value:
+#       none
+def randomize!(key)
     array = Array.new                                               # create an array of letters to pick from
     for x in 0...26
@@ -62,52 +95,80 @@ def randomize!(key)                                                 # completely
     end
 end
-print "best overall = ", score(ciphertext), " : best score = ", score(ciphertext), "\n" #print the original ciphertext
-puts ciphertext.gsub(/(.....)/, '\1 ')
-randomize!(key)                                                     # randomize the key
-best_score=score(ciphertext);                                       # set the best score to the score of the ciphertext
-best_overall=best_score-1;                                          # set the best overall score to the best score -1
-num_small_adjusts=0;                                                # set the number of small adjustments to 0
+# This function is the main entry point for this program, it is responsible for
+# implementing the main algorithm that solves the simple substitution cipher.
+# It will not return.  The only way to quit out of this function at present is
+# to hit CTRL-C.
+#   Parameters:
+#       ciphertext = the ciphertext that you are trying to decipher
+#   Return Value:
+#       none (presently the function never returns)
+def substitution_solver(ciphertext)
-loop do                                                             # loop forever
-    best_adj = best_score                                           # set the best adjustment to the current best score
+    ciphertext.gsub!(/[^a-zA-Z]/, "").upcase!                       # get rid of any non-alphabetic characters
-    for i in 0...26                                                 # loop through all possible "trivial" letter replacements
-        for j in i...26                                             # in the key looking for the best swap.  This in effect is
-            test_key = key.dup                                      # the so called "Hill Climbing" part of our program
-            temp = test_key[(i+65).chr]
-            test_key[(i+65).chr] = test_key[(j+65).chr]
-            test_key[(j+65).chr] = temp
-            sc = score(plaintext(ciphertext, test_key))             # score the change we've made
-            if sc > best_adj                                        # if it's better than any so far
-                best_adj=sc                                         # then record the change so we can apply it later if it
-                best_i = i                                          # turns out to be the best one
-                best_j = j
-            end
-        end
+    key = Hash.new                                                  # Create a hash that will represent the translation key
+    $dictionary = Hash.new(0)                                       # The dictionary of tetragraph frequencies
+    File.open("english.dic") do |f|                                 # Open the saved tetragraph information
+        $dictionary = Marshal.load(f)                               # And load this information into our dictionary
     end
-    if best_adj > best_score                                        # if we found an adjustment that improves the best score
-        temp = key[(best_i+65).chr]                                 # then apply that adjustment to the key
-        key[(best_i+65).chr] = key[(best_j+65).chr]
-        key[(best_j+65).chr] = temp
-        best_score = best_adj
-        if best_score > best_overall                                # if that adjustment is the best overall
-            num_small_adjusts = 0                                   # then reset the number of small adjusts counter
-            best_overall = best_score                               # set this new score as the best overall
-            print "best overall = ", best_overall, " : best score = ", best_score, " : iteration = #{$iteration}\n"
-            puts plaintext(ciphertext, key).gsub(/(.....)/, '\1 ')  # and print our new found best overall value
+    print "best overall = ", score(ciphertext), " : best score = ", score(ciphertext), "\n" #print the original ciphertext
+    puts ciphertext.gsub(/(.....)/, '\1 ')
+    randomize!(key)                                                 # randomize the key
+    best_score=score(ciphertext);                                   # set the best score to the score of the ciphertext
+    best_overall=best_score-1;                                      # set the best overall score to the best score -1
+    num_small_adjusts=0;                                            # set the number of small adjustments to 0
+    loop do                                                         # loop forever
+        best_adj = best_score                                       # set the best adjustment to the current best score
+        for i in 0...26                                             # loop through all possible "trivial" letter replacements
+            for j in i...26                                         # in the key looking for the best swap.  This in effect is
+                test_key = key.dup                                  # the so called "Hill Climbing" part of our program
+                temp = test_key[(i+65).chr]
+                test_key[(i+65).chr] = test_key[(j+65).chr]
+                test_key[(j+65).chr] = temp
+                sc = score(plaintext(ciphertext, test_key))         # score the change we've made
+                if sc > best_adj                                    # if it's better than any so far
+                    best_adj=sc                                     # then record the change so we can apply it later if it
+                    best_i = i                                      # turns out to be the best one
+                    best_j = j
+                end
+            end
         end
-    else                                                            # otherwise none of the adjustments raised are score
-        if num_small_adjusts < 10                                   # so make a small random adjustment to the key
-            small_adj!(key)                                         #  as long as we haven't already made to many small adjustments
-            num_small_adjusts += 1                                  # increment the number of small adjustments
-        else                                                        # otherwise we've made to many small adjustments, we're
-            randomize!(key)                                         #  probably not getting anywhere and need to start looking
-            num_small_adjusts = 0                                   #  somplace else, randomize the key and start climbing the
-        end                                                         #  hill again
-        best_score=score(plaintext(ciphertext, key))                # set the best score to either the small adjustment value or the new randomized string value depending on what we did above.
-     end
+        if best_adj > best_score                                    # if we found an adjustment that improves the best score
+            temp = key[(best_i+65).chr]                             # then apply that adjustment to the key
+            key[(best_i+65).chr] = key[(best_j+65).chr]
+            key[(best_j+65).chr] = temp
+            best_score = best_adj
+            if best_score > best_overall                            # if that adjustment is the best overall
+                num_small_adjusts = 0                               # then reset the number of small adjusts counter
+                best_overall = best_score                           # set this new score as the best overall
+                print "best overall = ", best_overall, " : best score = ", best_score, " : iteration = #{$iteration}\n"
+                puts plaintext(ciphertext, key).gsub(/(.....)/, '\1 ') # and print our new found best overall value
+            end
+        else                                                        # otherwise none of the adjustments raised are score
+            if num_small_adjusts < 10                               # so make a small random adjustment to the key
+                small_adj!(key)                                     #  as long as we haven't already made to many small adjustments
+                num_small_adjusts += 1                              # increment the number of small adjustments
+            else                                                    # otherwise we've made to many small adjustments, we're
+                randomize!(key)                                     #  probably not getting anywhere and need to start looking
+                num_small_adjusts = 0                               #  somplace else, randomize the key and start climbing the
+            end                                                     #  hill again
+            best_score=score(plaintext(ciphertext, key))            # set the best score to either the small adjustment value or the new randomized string value depending on what we did above.
+         end
+    end
+end
+ciphertext = String.new
+File::readlines(ARGV[0]).each do |line|                             # Grab the input from the standard input
+    ciphertext << line
 end
+substitution_solver(ciphertext)                                     # start the program on it's main loop

metadata CHANGED Viewed

@@ -3,12 +3,12 @@ rubygems_version: 0.8.10
 specification_version: 1
 name: substitution_solver
 version: !ruby/object:Gem::Version
-  version: 0.5.0
-date: 2005-11-09
+  version: 0.5.1
+date: 2005-11-17
 summary: "Program for solving mono-alphabetic simple substitution ciphers, (as in
   cryptoquotes), without word lengths."
 require_paths:
-  - lib
+  - "."
 email: pfharlock@yahoo.com
 homepage:
 rubyforge_project:
@@ -16,7 +16,7 @@ description:
 autorequire:
 default_executable:
 bindir: "."
-has_rdoc: false
+has_rdoc: true
 required_ruby_version: !ruby/object:Gem::Version::Requirement
   requirements:
     -