diff options
Diffstat (limited to 'markov-serialise.rb')
-rwxr-xr-x | markov-serialise.rb | 27 |
1 files changed, 0 insertions, 27 deletions
diff --git a/markov-serialise.rb b/markov-serialise.rb deleted file mode 100755 index 1199453..0000000 --- a/markov-serialise.rb +++ /dev/null @@ -1,27 +0,0 @@ -#!/usr/bin/env ruby - -CHUNK = ARGV[1].to_i - -stats = {"__SETTINGS__" => {"__CHUNK__" => CHUNK}} - -words = File.readlines(ARGV[0]) - .map(&:split) - .flatten - -(0 .. (words.length - CHUNK - CHUNK)).each do |i| - k = words[i...(i+CHUNK)] - v = words[(i+CHUNK)] - if stats.include?(k) then - t = stats[k] - if t.include?(v) then - t[v] += 1 - else - t[v] = 1 - end - else - stats[k] = Hash.new - stats[k][v] = 1 - end -end - -File.new(ARGV[2], "w").print(Marshal::dump(stats)) |