couchrest_model/examples/word_count/markov

39 lines
952 B
Text
Raw Normal View History

#!/usr/bin/env ruby
2008-06-02 09:34:04 -07:00
require File.expand_path(File.dirname(__FILE__)) + '/../../couchrest'
2008-12-14 12:05:02 +01:00
cr = CouchRest.new("http://127.0.0.1:5984")
2008-06-02 09:34:04 -07:00
@db = cr.database('word-count-example')
@word_memoizer = {}
def probable_follower_for(word)
@word_memoizer[word] ||= @db.view('markov/chain-reduce', :startkey => [word,nil], :endkey => [word,{}],:group_level => 2)
# puts
# puts "search #{word} #{wprobs[word]['rows'].length}"
# @word_memoizer[word]['rows'].sort_by{|r|r['value']}.each{|r|puts [r['value'],r['key']].inspect}
rows = @word_memoizer[word]['rows'].select{|r|(r['key'][1]!='')}.sort_by{|r|r['value']}
row = rows[(-1*[rows.length,5].min)..-1].sort_by{rand}[0]
row ? row['key'][1] : nil
end
word = ARGV[0]
words = [word]
while word
$stdout.print ' ' if words.length > 1
$stdout.print word
$stdout.flush
2008-06-02 09:34:04 -07:00
word = probable_follower_for(word)
words << word
end
$stdout.print '.'
$stdout.flush
puts
# `say #{words.join(' ')}`