More memory profiling

This commit is contained in:
Jaiden Mispy 2014-10-18 22:21:50 -07:00
parent b7f67ec0a6
commit 228e0caa65
7 changed files with 49 additions and 12 deletions

View file

@ -43,7 +43,7 @@ module Ebooks
config.oauth_token_secret = @oauth_token_secret config.oauth_token_secret = @oauth_token_secret
end end
Twitter.configure do |config| @twitter = Twitter::REST::Client.new do |config|
config.consumer_key = @consumer_key config.consumer_key = @consumer_key
config.consumer_secret = @consumer_secret config.consumer_secret = @consumer_secret
config.oauth_token = @oauth_token config.oauth_token = @oauth_token
@ -52,7 +52,6 @@ module Ebooks
needs_stream = [@on_follow, @on_message, @on_mention, @on_timeline].any? {|e| !e.nil?} needs_stream = [@on_follow, @on_message, @on_mention, @on_timeline].any? {|e| !e.nil?}
@twitter = Twitter::Client.new
@stream = TweetStream::Client.new if needs_stream @stream = TweetStream::Client.new if needs_stream
end end
@ -163,7 +162,7 @@ module Ebooks
log "Tweeting #{args.inspect}" log "Tweeting #{args.inspect}"
@twitter.update(*args) @twitter.update(*args)
end end
# could easily just be *args however the separation keeps it clean. # could easily just be *args however the separation keeps it clean.
def pictweet(txt, pic, *args) def pictweet(txt, pic, *args)
log "Tweeting #{txt.inspect} - #{pic} #{args}" log "Tweeting #{txt.inspect} - #{pic} #{args}"

View file

@ -79,8 +79,8 @@ module Ebooks
@sentences = mass_tokenize(text) @sentences = mass_tokenize(text)
@mentions = mass_tokenize(mention_text) @mentions = mass_tokenize(mention_text)
#log "Ranking keywords" log "Ranking keywords"
#@keywords = NLP.keywords(@sentences) @keywords = NLP.keywords(@sentences)
self self
end end

BIN
spec/data/0xabad1dea.model Normal file

Binary file not shown.

37
spec/memprof.rb Normal file
View file

@ -0,0 +1,37 @@
require 'objspace'
module MemoryUsage
MemoryReport = Struct.new(:total_memsize)
def self.full_gc
GC.start(full_mark: true)
end
def self.report(&block)
rvalue_size = GC::INTERNAL_CONSTANTS[:RVALUE_SIZE]
full_gc
GC.disable
total_memsize = 0
generation = nil
ObjectSpace.trace_object_allocations do
generation = GC.count
block.call
end
ObjectSpace.each_object do |obj|
next unless generation == ObjectSpace.allocation_generation(obj)
memsize = ObjectSpace.memsize_of(obj) + rvalue_size
# compensate for API bug
memsize = rvalue_size if memsize > 100_000_000_000
total_memsize += memsize
end
GC.enable
full_gc
return MemoryReport.new(total_memsize)
end
end

View file

@ -1,14 +1,14 @@
require 'spec_helper' require 'spec_helper'
require 'memory_profiler' require 'memory_profiler'
def Process.rss; `ps -o rss= -p #{Process.pid}`.chomp.to_i; end
describe Ebooks::Model do describe Ebooks::Model do
it "does not use a ridiculous amount of memory" do it "does not use a ridiculous amount of memory" do
RubyProf.start report = MemoryUsage.report do
Ebooks::Model.consume(path("data/0xabad1dea.json")) model = Ebooks::Model.consume(path("data/0xabad1dea.json"))
result = RubyProf.stop end
require 'pry'; binding.pry expect(report.total_memsize).to be < 1000000000
expect(report.total_retained).to be < 100000
end end
end end

View file

@ -1,4 +1,5 @@
require 'twitter_ebooks' require 'twitter_ebooks'
require_relative 'memprof'
def path(relpath) def path(relpath)
File.join(File.dirname(__FILE__), relpath) File.join(File.dirname(__FILE__), relpath)

View file

@ -16,7 +16,7 @@ Gem::Specification.new do |gem|
gem.version = Ebooks::VERSION gem.version = Ebooks::VERSION
gem.add_development_dependency 'rspec' gem.add_development_dependency 'rspec'
gem.add_development_dependency 'ruby-prof' gem.add_development_dependency 'memory_profiler'
gem.add_development_dependency 'pry-byebug' gem.add_development_dependency 'pry-byebug'