RUBY-120 configurable batch size; begin 0.20.2
This commit is contained in:
parent
49bc88c4b3
commit
b9f579876c
70
bin/batch_size_benchmark
Executable file
70
bin/batch_size_benchmark
Executable file
@ -0,0 +1,70 @@
|
|||||||
|
#!/usr/bin/env ruby
|
||||||
|
#$LOAD_PATH[0,0] = File.join(File.dirname(__FILE__), '..', 'lib')
|
||||||
|
#
|
||||||
|
# Note: Ruby 1.9 is faster than 1.8, as expected.
|
||||||
|
# This suite will be run against the installed version of ruby-mongo-driver.
|
||||||
|
# The c-extension, bson_ext, will be used if installed.
|
||||||
|
|
||||||
|
require 'rubygems'
|
||||||
|
require 'mongo'
|
||||||
|
|
||||||
|
large = {
|
||||||
|
'base_url' => 'http://www.example.com/test-me',
|
||||||
|
'total_word_count' => 6743,
|
||||||
|
'access_time' => Time.now,
|
||||||
|
'meta_tags' => {
|
||||||
|
'description' => 'i am a long description string',
|
||||||
|
'author' => 'Holly Man',
|
||||||
|
'dynamically_created_meta_tag' => 'who know\n what'
|
||||||
|
},
|
||||||
|
'page_structure' => {
|
||||||
|
'counted_tags' => 3450,
|
||||||
|
'no_of_js_attached' => 10,
|
||||||
|
'no_of_images' => 6
|
||||||
|
},
|
||||||
|
'harvested_words' => ['10gen','web','open','source','application','paas',
|
||||||
|
'platform-as-a-service','technology','helps',
|
||||||
|
'developers','focus','building','mongodb','mongo'] * 20
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
con = Mongo::Connection.new
|
||||||
|
|
||||||
|
db = con['benchmark']
|
||||||
|
col = db['bigdocs']
|
||||||
|
|
||||||
|
col.remove()
|
||||||
|
|
||||||
|
puts "Inserting 100,000 large documents..."
|
||||||
|
|
||||||
|
def get_batch(large)
|
||||||
|
batch = []
|
||||||
|
100.times do
|
||||||
|
batch << large.dup
|
||||||
|
end
|
||||||
|
batch
|
||||||
|
end
|
||||||
|
|
||||||
|
1000.times do
|
||||||
|
col.insert(get_batch(large))
|
||||||
|
end
|
||||||
|
GC.start
|
||||||
|
|
||||||
|
t1 = Time.now
|
||||||
|
cursor = col.find({}, :batch_size => 0)
|
||||||
|
200.times do
|
||||||
|
cursor.next_document
|
||||||
|
end
|
||||||
|
t2 = Time.now
|
||||||
|
puts "Database decides batch size: #{t2 - t1}"
|
||||||
|
|
||||||
|
|
||||||
|
t1 = Time.now
|
||||||
|
cursor = col.find({}, :batch_size => 100)
|
||||||
|
200.times do
|
||||||
|
cursor.next_document
|
||||||
|
end
|
||||||
|
t2 = Time.now
|
||||||
|
puts "Batch size of 100: #{t2 - t1}"
|
||||||
|
|
||||||
|
|
@ -14,4 +14,4 @@
|
|||||||
* limitations under the License.
|
* limitations under the License.
|
||||||
*/
|
*/
|
||||||
|
|
||||||
#define VERSION "0.20.1"
|
#define VERSION "0.20.2"
|
||||||
|
@ -1,7 +1,7 @@
|
|||||||
$:.unshift(File.join(File.dirname(__FILE__), '..', 'lib'))
|
$:.unshift(File.join(File.dirname(__FILE__), '..', 'lib'))
|
||||||
|
|
||||||
module BSON
|
module BSON
|
||||||
VERSION = "0.20.1"
|
VERSION = "0.20.2"
|
||||||
def self.serialize(obj, check_keys=false, move_id=false)
|
def self.serialize(obj, check_keys=false, move_id=false)
|
||||||
BSON_CODER.serialize(obj, check_keys, move_id)
|
BSON_CODER.serialize(obj, check_keys, move_id)
|
||||||
end
|
end
|
||||||
|
@ -1,7 +1,7 @@
|
|||||||
$:.unshift(File.join(File.dirname(__FILE__), '..', 'lib'))
|
$:.unshift(File.join(File.dirname(__FILE__), '..', 'lib'))
|
||||||
|
|
||||||
module Mongo
|
module Mongo
|
||||||
VERSION = "0.20.1"
|
VERSION = "0.20.2"
|
||||||
end
|
end
|
||||||
|
|
||||||
module Mongo
|
module Mongo
|
||||||
@ -21,6 +21,8 @@ module Mongo
|
|||||||
|
|
||||||
OP_QUERY_SLAVE_OK = 4
|
OP_QUERY_SLAVE_OK = 4
|
||||||
OP_QUERY_NO_CURSOR_TIMEOUT = 16
|
OP_QUERY_NO_CURSOR_TIMEOUT = 16
|
||||||
|
|
||||||
|
DEFAULT_BATCH_SIZE = 100
|
||||||
end
|
end
|
||||||
|
|
||||||
end
|
end
|
||||||
|
@ -120,6 +120,8 @@ module Mongo
|
|||||||
# @option opts [Boolean] :snapshot ('false') if true, snapshot mode will be used for this query.
|
# @option opts [Boolean] :snapshot ('false') if true, snapshot mode will be used for this query.
|
||||||
# Snapshot mode assures no duplicates are returned, or objects missed, which were preset at both the start and
|
# Snapshot mode assures no duplicates are returned, or objects missed, which were preset at both the start and
|
||||||
# end of the query's execution. For details see http://www.mongodb.org/display/DOCS/How+to+do+Snapshotting+in+the+Mongo+Database
|
# end of the query's execution. For details see http://www.mongodb.org/display/DOCS/How+to+do+Snapshotting+in+the+Mongo+Database
|
||||||
|
# @option opts [Boolean] :batch_size (100) the number of documents to returned by the database per GETMORE operation. A value of 0
|
||||||
|
# will let the database server decide how many results to returns. This option can be ignored for most use cases.
|
||||||
# @option opts [Boolean] :timeout ('true') when +true+, the returned cursor will be subject to
|
# @option opts [Boolean] :timeout ('true') when +true+, the returned cursor will be subject to
|
||||||
# the normal cursor timeout behavior of the mongod process. When +false+, the returned cursor will never timeout. Note
|
# the normal cursor timeout behavior of the mongod process. When +false+, the returned cursor will never timeout. Note
|
||||||
# that disabling timeout will only work when #find is invoked with a block. This is to prevent any inadvertant failure to
|
# that disabling timeout will only work when #find is invoked with a block. This is to prevent any inadvertant failure to
|
||||||
@ -140,6 +142,7 @@ module Mongo
|
|||||||
sort = opts.delete(:sort)
|
sort = opts.delete(:sort)
|
||||||
hint = opts.delete(:hint)
|
hint = opts.delete(:hint)
|
||||||
snapshot = opts.delete(:snapshot)
|
snapshot = opts.delete(:snapshot)
|
||||||
|
batch_size = opts.delete(:batch_size)
|
||||||
if opts[:timeout] == false && !block_given?
|
if opts[:timeout] == false && !block_given?
|
||||||
raise ArgumentError, "Timeout can be set to false only when #find is invoked with a block."
|
raise ArgumentError, "Timeout can be set to false only when #find is invoked with a block."
|
||||||
end
|
end
|
||||||
@ -152,7 +155,7 @@ module Mongo
|
|||||||
raise RuntimeError, "Unknown options [#{opts.inspect}]" unless opts.empty?
|
raise RuntimeError, "Unknown options [#{opts.inspect}]" unless opts.empty?
|
||||||
|
|
||||||
cursor = Cursor.new(self, :selector => selector, :fields => fields, :skip => skip, :limit => limit,
|
cursor = Cursor.new(self, :selector => selector, :fields => fields, :skip => skip, :limit => limit,
|
||||||
:order => sort, :hint => hint, :snapshot => snapshot, :timeout => timeout)
|
:order => sort, :hint => hint, :snapshot => snapshot, :timeout => timeout, :batch_size => batch_size)
|
||||||
if block_given?
|
if block_given?
|
||||||
yield cursor
|
yield cursor
|
||||||
cursor.close()
|
cursor.close()
|
||||||
|
@ -47,6 +47,7 @@ module Mongo
|
|||||||
@timeout = options[:timeout] || false
|
@timeout = options[:timeout] || false
|
||||||
@explain = options[:explain]
|
@explain = options[:explain]
|
||||||
@socket = options[:socket]
|
@socket = options[:socket]
|
||||||
|
@batch_size = options[:batch_size] || Mongo::Constants::DEFAULT_BATCH_SIZE
|
||||||
|
|
||||||
@full_collection_name = "#{@collection.db.name}.#{@collection.name}"
|
@full_collection_name = "#{@collection.db.name}.#{@collection.name}"
|
||||||
@cache = []
|
@cache = []
|
||||||
@ -317,8 +318,8 @@ module Mongo
|
|||||||
db_name = @admin ? 'admin' : @db.name
|
db_name = @admin ? 'admin' : @db.name
|
||||||
BSON::BSON_RUBY.serialize_cstr(message, "#{db_name}.#{@collection.name}")
|
BSON::BSON_RUBY.serialize_cstr(message, "#{db_name}.#{@collection.name}")
|
||||||
|
|
||||||
# Number of results to return; db decides for now.
|
# Number of results to return.
|
||||||
message.put_int(0)
|
message.put_int(@batch_size)
|
||||||
|
|
||||||
# Cursor id.
|
# Cursor id.
|
||||||
message.put_long(@cursor_id)
|
message.put_long(@cursor_id)
|
||||||
|
Loading…
Reference in New Issue
Block a user