2010-12-13 20:22:51 +00:00
|
|
|
#!/usr/bin/ruby
|
|
|
|
|
2010-12-13 21:25:23 +00:00
|
|
|
STDOUT.sync = true
|
|
|
|
|
|
|
|
unless defined? Mongo
|
|
|
|
require File.join(File.dirname(__FILE__), '..', '..', 'lib', 'mongo')
|
|
|
|
end
|
2010-12-13 20:22:51 +00:00
|
|
|
|
|
|
|
class ReplSetManager
|
|
|
|
|
2010-12-14 18:14:45 +00:00
|
|
|
attr_accessor :host, :start_port, :ports, :name, :mongods
|
2010-12-13 21:25:23 +00:00
|
|
|
|
2010-12-13 20:22:51 +00:00
|
|
|
def initialize(opts={})
|
|
|
|
@start_port = opts[:start_port] || 30000
|
2010-12-13 21:25:23 +00:00
|
|
|
@ports = []
|
2010-12-13 20:22:51 +00:00
|
|
|
@name = opts[:name] || 'replica-set-foo'
|
|
|
|
@host = opts[:host] || 'localhost'
|
|
|
|
@retries = opts[:retries] || 60
|
|
|
|
@config = {"_id" => @name, "members" => []}
|
|
|
|
@path = File.join(File.expand_path(File.dirname(__FILE__)), "data")
|
|
|
|
|
2010-12-14 20:47:18 +00:00
|
|
|
@arbiter_count = opts[:arbiter_count] || 2
|
|
|
|
@secondary_count = opts[:secondary_count] || 1
|
|
|
|
@passive_count = opts[:passive_count] || 1
|
2010-12-14 18:14:45 +00:00
|
|
|
@primary_count = 1
|
|
|
|
|
|
|
|
@count = @primary_count + @passive_count + @arbiter_count + @secondary_count
|
|
|
|
if @count > 7
|
|
|
|
raise StandardError, "Cannot create a replica set with #{node_count} nodes. 7 is the max."
|
|
|
|
end
|
|
|
|
|
2010-12-13 20:22:51 +00:00
|
|
|
@mongods = {}
|
|
|
|
end
|
|
|
|
|
|
|
|
def start_set
|
2010-12-14 20:47:18 +00:00
|
|
|
puts "** Starting a replica set with #{@count} nodes"
|
2010-12-13 20:22:51 +00:00
|
|
|
|
|
|
|
system("killall mongod")
|
2010-12-13 21:25:23 +00:00
|
|
|
|
2010-12-14 18:14:45 +00:00
|
|
|
n = 0
|
|
|
|
(@primary_count + @secondary_count).times do |n|
|
|
|
|
init_node(n)
|
|
|
|
n += 1
|
|
|
|
end
|
|
|
|
|
|
|
|
@passive_count.times do
|
|
|
|
init_node(n) do |attrs|
|
|
|
|
attrs['priority'] = 0
|
2010-12-13 20:22:51 +00:00
|
|
|
end
|
2010-12-14 18:14:45 +00:00
|
|
|
n += 1
|
|
|
|
end
|
2010-12-13 20:22:51 +00:00
|
|
|
|
2010-12-14 18:14:45 +00:00
|
|
|
@arbiter_count.times do
|
|
|
|
init_node(n) do |attrs|
|
|
|
|
attrs['arbiterOnly'] = true
|
|
|
|
end
|
|
|
|
n += 1
|
2010-12-13 20:22:51 +00:00
|
|
|
end
|
|
|
|
|
2010-12-14 18:14:45 +00:00
|
|
|
initiate
|
2010-12-13 20:22:51 +00:00
|
|
|
ensure_up
|
|
|
|
end
|
|
|
|
|
2011-02-02 16:26:31 +00:00
|
|
|
def cleanup_set
|
|
|
|
system("killall mongod")
|
|
|
|
@count.times do |n|
|
|
|
|
system("rm -rf #{@mongods[n]['db_path']}")
|
|
|
|
end
|
|
|
|
end
|
|
|
|
|
2010-12-14 18:14:45 +00:00
|
|
|
def init_node(n)
|
|
|
|
@mongods[n] ||= {}
|
|
|
|
port = @start_port + n
|
|
|
|
@ports << port
|
|
|
|
@mongods[n]['port'] = port
|
|
|
|
@mongods[n]['db_path'] = get_path("rs-#{port}")
|
|
|
|
@mongods[n]['log_path'] = get_path("log-#{port}")
|
|
|
|
system("rm -rf #{@mongods[n]['db_path']}")
|
|
|
|
system("mkdir -p #{@mongods[n]['db_path']}")
|
|
|
|
|
2011-02-02 16:26:31 +00:00
|
|
|
@mongods[n]['start'] = start_cmd(n)
|
2010-12-14 18:14:45 +00:00
|
|
|
start(n)
|
|
|
|
|
|
|
|
member = {'_id' => n, 'host' => "#{@host}:#{@mongods[n]['port']}"}
|
|
|
|
|
|
|
|
if block_given?
|
|
|
|
custom_attrs = {}
|
|
|
|
yield custom_attrs
|
|
|
|
member.merge!(custom_attrs)
|
|
|
|
@mongods[n].merge!(custom_attrs)
|
|
|
|
end
|
|
|
|
|
|
|
|
@config['members'] << member
|
|
|
|
end
|
|
|
|
|
2011-02-02 16:26:31 +00:00
|
|
|
def start_cmd(n)
|
|
|
|
@mongods[n]['start'] = "mongod --replSet #{@name} --logpath '#{@mongods[n]['log_path']}' " +
|
|
|
|
" --dbpath #{@mongods[n]['db_path']} --port #{@mongods[n]['port']} --fork"
|
|
|
|
end
|
|
|
|
|
2010-12-13 20:22:51 +00:00
|
|
|
def kill(node)
|
2010-12-14 20:47:18 +00:00
|
|
|
pid = @mongods[node]['pid']
|
|
|
|
puts "** Killing node with pid #{pid} at port #{@mongods[node]['port']}"
|
2010-12-13 20:22:51 +00:00
|
|
|
system("kill -2 #{@mongods[node]['pid']}")
|
|
|
|
@mongods[node]['up'] = false
|
|
|
|
sleep(1)
|
|
|
|
end
|
|
|
|
|
2010-12-13 21:25:23 +00:00
|
|
|
def kill_primary
|
|
|
|
node = get_node_with_state(1)
|
|
|
|
kill(node)
|
|
|
|
return node
|
|
|
|
end
|
|
|
|
|
2010-12-14 18:14:45 +00:00
|
|
|
# Note that we have to rescue a connection failure
|
|
|
|
# when we run the StepDown command because that
|
|
|
|
# command will close the connection.
|
|
|
|
def step_down_primary
|
|
|
|
primary = get_node_with_state(1)
|
|
|
|
con = get_connection(primary)
|
|
|
|
begin
|
|
|
|
con['admin'].command({'replSetStepDown' => 90})
|
|
|
|
rescue Mongo::ConnectionFailure
|
|
|
|
end
|
|
|
|
end
|
|
|
|
|
2010-12-13 21:25:23 +00:00
|
|
|
def kill_secondary
|
|
|
|
node = get_node_with_state(2)
|
|
|
|
kill(node)
|
|
|
|
return node
|
|
|
|
end
|
|
|
|
|
2010-12-14 18:14:45 +00:00
|
|
|
def restart_killed_nodes
|
|
|
|
nodes = @mongods.keys.select do |key|
|
|
|
|
@mongods[key]['up'] == false
|
|
|
|
end
|
|
|
|
|
|
|
|
nodes.each do |node|
|
|
|
|
start(node)
|
|
|
|
end
|
|
|
|
|
|
|
|
ensure_up
|
|
|
|
end
|
|
|
|
|
|
|
|
def get_node_from_port(port)
|
|
|
|
@mongods.keys.detect { |key| @mongods[key]['port'] == port }
|
|
|
|
end
|
|
|
|
|
2010-12-13 20:22:51 +00:00
|
|
|
def start(node)
|
|
|
|
system(@mongods[node]['start'])
|
|
|
|
@mongods[node]['up'] = true
|
2010-12-14 20:47:18 +00:00
|
|
|
sleep(0.5)
|
2010-12-13 20:22:51 +00:00
|
|
|
@mongods[node]['pid'] = File.open(File.join(@mongods[node]['db_path'], 'mongod.lock')).read.strip
|
|
|
|
end
|
|
|
|
alias :restart :start
|
|
|
|
|
|
|
|
def ensure_up
|
2010-12-14 20:47:18 +00:00
|
|
|
print "** Ensuring members are up..."
|
2010-12-13 20:22:51 +00:00
|
|
|
|
2010-12-15 20:07:01 +00:00
|
|
|
attempt do
|
2010-12-14 18:14:45 +00:00
|
|
|
con = get_connection
|
|
|
|
status = con['admin'].command({'replSetGetStatus' => 1})
|
2010-12-13 21:25:23 +00:00
|
|
|
print "."
|
2010-12-14 22:38:52 +00:00
|
|
|
if status['members'].all? { |m| m['health'] == 1 && [1, 2, 7].include?(m['state']) } &&
|
2010-12-14 18:14:45 +00:00
|
|
|
status['members'].any? { |m| m['state'] == 1 }
|
2010-12-14 20:47:18 +00:00
|
|
|
print "all members up!\n\n"
|
2010-12-13 21:25:23 +00:00
|
|
|
return status
|
2010-12-13 20:22:51 +00:00
|
|
|
else
|
|
|
|
raise Mongo::OperationFailure
|
|
|
|
end
|
|
|
|
end
|
|
|
|
end
|
|
|
|
|
2010-12-14 18:14:45 +00:00
|
|
|
def primary
|
|
|
|
nodes = get_all_host_pairs_with_state(1)
|
|
|
|
nodes.empty? ? nil : nodes[0]
|
|
|
|
end
|
|
|
|
|
|
|
|
def secondaries
|
|
|
|
get_all_host_pairs_with_state(2)
|
|
|
|
end
|
|
|
|
|
|
|
|
def arbiters
|
|
|
|
get_all_host_pairs_with_state(7)
|
|
|
|
end
|
|
|
|
|
2010-12-13 20:22:51 +00:00
|
|
|
private
|
|
|
|
|
2010-12-14 18:14:45 +00:00
|
|
|
def initiate
|
|
|
|
con = get_connection
|
2010-12-13 20:22:51 +00:00
|
|
|
|
2010-12-15 20:07:01 +00:00
|
|
|
attempt do
|
2010-12-14 18:14:45 +00:00
|
|
|
con['admin'].command({'replSetInitiate' => @config})
|
2010-12-13 20:22:51 +00:00
|
|
|
end
|
|
|
|
end
|
|
|
|
|
2010-12-13 21:25:23 +00:00
|
|
|
def get_node_with_state(state)
|
|
|
|
status = ensure_up
|
|
|
|
node = status['members'].detect {|m| m['state'] == state}
|
|
|
|
if node
|
|
|
|
host_port = node['name'].split(':')
|
|
|
|
port = host_port[1] ? host_port[1].to_i : 27017
|
|
|
|
key = @mongods.keys.detect {|key| @mongods[key]['port'] == port}
|
|
|
|
return key
|
|
|
|
else
|
|
|
|
return false
|
|
|
|
end
|
|
|
|
end
|
|
|
|
|
2010-12-14 18:14:45 +00:00
|
|
|
def get_all_host_pairs_with_state(state)
|
|
|
|
status = ensure_up
|
|
|
|
nodes = status['members'].select {|m| m['state'] == state}
|
|
|
|
nodes.map do |node|
|
|
|
|
host_port = node['name'].split(':')
|
|
|
|
port = host_port[1] ? host_port[1].to_i : 27017
|
|
|
|
[host, port]
|
|
|
|
end
|
|
|
|
end
|
|
|
|
|
|
|
|
def get_connection(node=nil)
|
2010-12-15 20:07:01 +00:00
|
|
|
con = attempt do
|
2010-12-14 18:14:45 +00:00
|
|
|
if !node
|
|
|
|
node = @mongods.keys.detect {|key| !@mongods[key]['arbiterOnly'] && @mongods[key]['up'] }
|
|
|
|
end
|
|
|
|
con = Mongo::Connection.new(@host, @mongods[node]['port'], :slave_ok => true)
|
2010-12-13 20:22:51 +00:00
|
|
|
end
|
|
|
|
|
2010-12-14 18:14:45 +00:00
|
|
|
return con
|
2010-12-13 20:22:51 +00:00
|
|
|
end
|
|
|
|
|
|
|
|
def get_path(name)
|
2010-12-13 21:25:23 +00:00
|
|
|
File.join(@path, name)
|
2010-12-13 20:22:51 +00:00
|
|
|
end
|
|
|
|
|
2010-12-15 20:07:01 +00:00
|
|
|
def attempt
|
2010-12-13 20:22:51 +00:00
|
|
|
raise "No block given!" unless block_given?
|
|
|
|
count = 0
|
|
|
|
|
|
|
|
while count < @retries do
|
|
|
|
begin
|
2010-12-14 18:14:45 +00:00
|
|
|
return yield
|
2010-12-15 20:07:01 +00:00
|
|
|
rescue Mongo::OperationFailure, Mongo::ConnectionFailure
|
2010-12-13 20:22:51 +00:00
|
|
|
sleep(1)
|
|
|
|
count += 1
|
|
|
|
end
|
|
|
|
end
|
|
|
|
|
|
|
|
raise exception
|
|
|
|
end
|
|
|
|
|
|
|
|
end
|