Bot anti-bot measures
We assume a user is a bot if its username contains 'ebooks' or if it replies more than once within a 30-second window.
This commit is contained in:
parent
8326fc19dd
commit
29beb23502
3 changed files with 209 additions and 67 deletions
|
@ -49,13 +49,56 @@ module Ebooks
|
|||
# Error class for bot configuration problems (going by its name; the sites
# that raise it are outside this view).
#
# Derives from StandardError rather than Exception so that a plain `rescue`
# or `rescue => e` can handle it. Code that rescues ConfigurationError or
# Exception explicitly keeps working unchanged.
class ConfigurationError < StandardError
end
|
||||
|
||||
# UserInfo tracks some meta information for how much
|
||||
# we've interacted with a user, and how much they've responded
|
||||
# We track how many unprompted interactions the bot has had with
|
||||
# each user and start dropping them from mentions after two in a row
|
||||
class UserInfo
|
||||
attr_accessor :times_bugged, :times_responded
|
||||
def initialize
|
||||
self.times_bugged = 0
|
||||
self.times_responded = 0
|
||||
attr_reader :username
|
||||
attr_accessor :pester_count
|
||||
|
||||
def initialize(username)
|
||||
@username = username
|
||||
@pester_count = 0
|
||||
end
|
||||
|
||||
def can_pester?
|
||||
@pester_count < 2
|
||||
end
|
||||
end
|
||||
|
||||
# Represents a current "interaction state" with another user
|
||||
# Represents a current "interaction state" with another user: the tweets
# received from them so far and the time of the most recent activity.
class Interaction
  # Two consecutive tweets created less than this many seconds apart mark
  # the sender as a suspected bot.
  BOT_REPLY_WINDOW = 30

  # A suspected bot is only answered while fewer than this many of its
  # tweets have been received in this interaction.
  MAX_BOT_TWEETS = 2

  attr_reader :userinfo, :received, :last_update

  # @param userinfo [#username, #pester_count=] record kept for the other user
  def initialize(userinfo)
    @userinfo = userinfo
    @received = []
    @last_update = Time.now
  end

  # Records an incoming tweet, refreshes the last-activity timestamp and
  # resets the user's pester counter to zero.
  #
  # @param tweet [#created_at] the tweet just received from this user
  def receive(tweet)
    @received << tweet
    @last_update = Time.now
    @userinfo.pester_count = 0
  end

  # Make an informed guess as to whether this user is a bot
  # based on its username and reply speed.
  #
  # @return [Boolean] true when the two latest tweets are less than
  #   BOT_REPLY_WINDOW seconds apart, or the username contains "ebooks"
  def is_bot?
    return true if replied_too_fast?

    # Compare case-insensitively so names such as "Horse_EBooks" are caught too.
    @userinfo.username.downcase.include?("ebooks")
  end

  # Whether the conversation with this user should go on.
  #
  # @return [Boolean] always true for users not flagged by #is_bot?; for
  #   suspected bots, true only while fewer than MAX_BOT_TWEETS tweets have
  #   been received
  def continue?
    !is_bot? || @received.length < MAX_BOT_TWEETS
  end

  private

  # True when at least two tweets have been received and the latest two were
  # created less than BOT_REPLY_WINDOW seconds apart.
  def replied_too_fast?
    return false if @received.length < 2

    (@received[-1].created_at - @received[-2].created_at) < BOT_REPLY_WINDOW
  end
end
|
||||
|
||||
|
@ -80,13 +123,27 @@ module Ebooks
|
|||
STDOUT.flush
|
||||
end
|
||||
|
||||
def initialize
|
||||
def initialize(*args, &b)
|
||||
@username ||= nil
|
||||
@blacklist ||= []
|
||||
@delay_range ||= 0
|
||||
|
||||
@users ||= {}
|
||||
configure
|
||||
@interactions ||= {}
|
||||
configure(*args, &b)
|
||||
end
|
||||
|
||||
# Returns the UserInfo record stored in @users for +username+, creating and
# storing a new one the first time that name is looked up.
def userinfo(username)
  known = @users[username]
  return known if known

  @users[username] = UserInfo.new(username)
end
|
||||
|
||||
# Returns the Interaction in progress with +username+. An existing one is
# reused only if it was updated less than 600 seconds ago; otherwise a new
# Interaction is created, stored in @interactions and returned.
def interaction(username)
  current = @interactions[username]
  return current if current && Time.now - current.last_update < 600

  @interactions[username] = Interaction.new(userinfo(username))
end
|
||||
|
||||
def make_client
|
||||
|
@ -112,18 +169,34 @@ module Ebooks
|
|||
meta = {}
|
||||
meta[:mentions] = ev.attrs[:entities][:user_mentions].map { |x| x[:screen_name] }
|
||||
|
||||
# To check if this is someone talking to us, ensure:
|
||||
# - The tweet mentions list contains our username
|
||||
# - The tweet is not being retweeted by somebody else
|
||||
# - Or soft-retweeted by somebody else
|
||||
meta[:mentions_bot] = meta[:mentions].map(&:downcase).include?(@username.downcase) && !ev.retweeted_status? && !ev.text.start_with?('RT ')
|
||||
|
||||
# Process mentions to figure out who to reply to
|
||||
reply_mentions = meta[:mentions].reject { |m| m.downcase == @username.downcase }
|
||||
reply_mentions = [ev.user.screen_name] + reply_mentions
|
||||
reply_mentions = reply_mentions.select { |username| userinfo(username).can_pester? }
|
||||
meta[:reply_mentions] = [ev.user.screen_name] + reply_mentions
|
||||
|
||||
# Don't reply to more than three users at a time
|
||||
if reply_mentions.length > 3
|
||||
log "Truncating reply_mentions to the first three users"
|
||||
reply_mentions = reply_mentions[0..2]
|
||||
end
|
||||
|
||||
meta[:reply_prefix] = reply_mentions.uniq.map { |m| '@'+m }.join(' ') + ' '
|
||||
meta[:reply_prefix] = meta[:reply_mentions].uniq.map { |m| '@'+m }.join(' ') + ' '
|
||||
|
||||
meta[:limit] = 140 - meta[:reply_prefix].length
|
||||
|
||||
mless = ev.text
|
||||
begin
|
||||
ev.attrs[:entities][:user_mentions].reverse.each do |entity|
|
||||
last = mless[entity[:indices][1]..-1]||''
|
||||
mless = mless[0...entity[:indices][0]] + last.strip
|
||||
end
|
||||
rescue Exception
|
||||
p ev.attrs[:entities][:user_mentions]
|
||||
p ev.text
|
||||
raise
|
||||
end
|
||||
meta[:mentionless] = mless
|
||||
|
||||
meta
|
||||
end
|
||||
|
||||
|
@ -150,29 +223,14 @@ module Ebooks
|
|||
|
||||
meta = calc_meta(ev)
|
||||
|
||||
mless = ev.text
|
||||
begin
|
||||
ev.attrs[:entities][:user_mentions].reverse.each do |entity|
|
||||
last = mless[entity[:indices][1]..-1]||''
|
||||
mless = mless[0...entity[:indices][0]] + last.strip
|
||||
end
|
||||
rescue Exception
|
||||
p ev.attrs[:entities][:user_mentions]
|
||||
p ev.text
|
||||
raise
|
||||
end
|
||||
meta[:mentionless] = mless
|
||||
|
||||
# To check if this is a mention, ensure:
|
||||
# - The tweet mentions list contains our username
|
||||
# - The tweet is not being retweeted by somebody else
|
||||
# - Or soft-retweeted by somebody else
|
||||
if meta[:mentions].map(&:downcase).include?(@username.downcase) && !ev.retweeted_status? && !ev.text.start_with?('RT ')
|
||||
if meta[:mentions_bot]
|
||||
log "Mention from @#{ev.user.screen_name}: #{ev.text}"
|
||||
interaction(ev.user.screen_name).receive(ev)
|
||||
fire(:mention, ev, meta)
|
||||
else
|
||||
fire(:timeline, ev, meta)
|
||||
end
|
||||
|
||||
elsif ev.is_a? Twitter::Streaming::DeletedTweet
|
||||
# pass
|
||||
else
|
||||
|
@ -242,9 +300,20 @@ module Ebooks
|
|||
elsif ev.is_a? Twitter::Tweet
|
||||
meta = calc_meta(ev)
|
||||
|
||||
return if blacklisted?(ev.user.screen_name)
|
||||
log "Replying to @#{ev.user.screen_name} with: #{text}"
|
||||
if blacklisted?(ev.user.screen_name)
|
||||
log "Not replying to blacklisted user @#{ev.user.screen_name}"
|
||||
return
|
||||
elsif !interaction(ev.user.screen_name).continue?
|
||||
log "Not replying to suspected bot @#{ev.user.screen_name}"
|
||||
return
|
||||
end
|
||||
|
||||
log "Replying to @#{ev.user.screen_name} with: #{meta[:reply_prefix] + text}"
|
||||
@twitter.update(meta[:reply_prefix] + text, in_reply_to_status_id: ev.id)
|
||||
|
||||
meta[:reply_mentions].each do |username|
|
||||
userinfo(username).pester_count += 1
|
||||
end
|
||||
else
|
||||
raise Exception("Don't know how to reply to a #{ev.class}")
|
||||
end
|
||||
|
|
134
spec/bot_spec.rb
134
spec/bot_spec.rb
|
@ -1,6 +1,7 @@
|
|||
require 'spec_helper'
|
||||
require 'memory_profiler'
|
||||
require 'tempfile'
|
||||
require 'timecop'
|
||||
|
||||
def Process.rss; `ps -o rss= -p #{Process.pid}`.chomp.to_i; end
|
||||
|
||||
|
@ -24,52 +25,123 @@ class TestBot < Ebooks::Bot
|
|||
end
|
||||
end
|
||||
|
||||
def twitter_id
|
||||
533295311591337984
|
||||
end
|
||||
module Ebooks::Test
|
||||
# Generates a random twitter id
|
||||
def twitter_id
|
||||
(rand*10**18).to_i
|
||||
end
|
||||
|
||||
def mock_dm(username, text)
|
||||
Twitter::DirectMessage.new(id: twitter_id,
|
||||
sender: { id: twitter_id, screen_name: username},
|
||||
text: text)
|
||||
end
|
||||
# Creates a mock direct message
|
||||
# @param username User sending the DM
|
||||
# @param text DM content
|
||||
def mock_dm(username, text)
|
||||
Twitter::DirectMessage.new(id: twitter_id,
|
||||
sender: { id: twitter_id, screen_name: username},
|
||||
text: text)
|
||||
end
|
||||
|
||||
def mock_tweet(username, text)
|
||||
mentions = text.split.find_all { |x| x.start_with?('@') }
|
||||
Twitter::Tweet.new(
|
||||
id: twitter_id,
|
||||
user: { id: twitter_id, screen_name: username },
|
||||
text: text,
|
||||
entities: {
|
||||
user_mentions: mentions.map { |m|
|
||||
{ screen_name: m.split('@')[1],
|
||||
indices: [text.index(m), text.index(m)+m.length] }
|
||||
# Creates a mock tweet
|
||||
# @param username User sending the tweet
|
||||
# @param text Tweet content
|
||||
def mock_tweet(username, text)
|
||||
mentions = text.split.find_all { |x| x.start_with?('@') }
|
||||
Twitter::Tweet.new(
|
||||
id: twitter_id,
|
||||
user: { id: twitter_id, screen_name: username },
|
||||
text: text,
|
||||
created_at: Time.now.to_s,
|
||||
entities: {
|
||||
user_mentions: mentions.map { |m|
|
||||
{ screen_name: m.split('@')[1],
|
||||
indices: [text.index(m), text.index(m)+m.length] }
|
||||
}
|
||||
}
|
||||
}
|
||||
)
|
||||
)
|
||||
end
|
||||
|
||||
def simulate(bot, &b)
|
||||
bot.twitter = spy("twitter")
|
||||
b.call
|
||||
end
|
||||
|
||||
def expect_direct_message(bot, content)
|
||||
expect(bot.twitter).to have_received(:create_direct_message).with(anything(), content, {})
|
||||
bot.twitter = spy("twitter")
|
||||
end
|
||||
|
||||
def expect_tweet(bot, content)
|
||||
expect(bot.twitter).to have_received(:update).with(content, anything())
|
||||
bot.twitter = spy("twitter")
|
||||
end
|
||||
end
|
||||
|
||||
|
||||
describe Ebooks::Bot do
|
||||
include Ebooks::Test
|
||||
let(:bot) { TestBot.new }
|
||||
|
||||
before { Timecop.freeze }
|
||||
after { Timecop.return }
|
||||
|
||||
it "responds to dms" do
|
||||
bot.twitter = double("twitter")
|
||||
expect(bot.twitter).to receive(:create_direct_message).with("m1sp", "echo: this is a dm", {})
|
||||
bot.receive_event(mock_dm("m1sp", "this is a dm"))
|
||||
simulate(bot) do
|
||||
bot.receive_event(mock_dm("m1sp", "this is a dm"))
|
||||
expect_direct_message(bot, "echo: this is a dm")
|
||||
end
|
||||
end
|
||||
|
||||
it "responds to mentions" do
|
||||
bot.twitter = double("twitter")
|
||||
expect(bot.twitter).to receive(:update).with("@m1sp echo: this is a mention",
|
||||
in_reply_to_status_id: twitter_id)
|
||||
bot.receive_event(mock_tweet("m1sp", "@test_ebooks this is a mention"))
|
||||
simulate(bot) do
|
||||
bot.receive_event(mock_tweet("m1sp", "@test_ebooks this is a mention"))
|
||||
expect_tweet(bot, "@m1sp echo: this is a mention")
|
||||
end
|
||||
end
|
||||
|
||||
it "responds to timeline tweets" do
|
||||
bot.twitter = double("twitter")
|
||||
expect(bot.twitter).to receive(:update).with("@m1sp fine tweet good sir",
|
||||
in_reply_to_status_id: twitter_id)
|
||||
simulate(bot) do
|
||||
bot.receive_event(mock_tweet("m1sp", "some excellent tweet"))
|
||||
expect_tweet(bot, "@m1sp fine tweet good sir")
|
||||
end
|
||||
end
|
||||
|
||||
bot.receive_event(mock_tweet("m1sp", "some excellent tweet"))
|
||||
it "stops mentioning people after a certain limit" do
|
||||
simulate(bot) do
|
||||
bot.receive_event(mock_tweet("spammer", "@test_ebooks @m1sp 1"))
|
||||
expect_tweet(bot, "@spammer @m1sp echo: 1")
|
||||
|
||||
Timecop.travel(Time.now + 60)
|
||||
bot.receive_event(mock_tweet("spammer", "@test_ebooks @m1sp 2"))
|
||||
expect_tweet(bot, "@spammer @m1sp echo: 2")
|
||||
|
||||
Timecop.travel(Time.now + 60)
|
||||
bot.receive_event(mock_tweet("spammer", "@test_ebooks @m1sp 3"))
|
||||
expect_tweet(bot, "@spammer echo: 3")
|
||||
end
|
||||
end
|
||||
|
||||
it "doesn't stop mentioning them if they reply" do
|
||||
simulate(bot) do
|
||||
bot.receive_event(mock_tweet("spammer", "@test_ebooks @m1sp 4"))
|
||||
expect_tweet(bot, "@spammer @m1sp echo: 4")
|
||||
|
||||
Timecop.travel(Time.now + 60)
|
||||
bot.receive_event(mock_tweet("m1sp", "@spammer @test_ebooks 5"))
|
||||
expect_tweet(bot, "@m1sp @spammer echo: 5")
|
||||
|
||||
Timecop.travel(Time.now + 60)
|
||||
bot.receive_event(mock_tweet("spammer", "@test_ebooks @m1sp 6"))
|
||||
expect_tweet(bot, "@spammer @m1sp echo: 6")
|
||||
end
|
||||
end
|
||||
|
||||
it "doesn't get into infinite bot conversations" do
|
||||
simulate(bot) do
|
||||
bot.receive_event(mock_tweet("spammer", "@test_ebooks @m1sp 7"))
|
||||
expect_tweet(bot, "@spammer @m1sp echo: 7")
|
||||
|
||||
Timecop.travel(Time.now + 10)
|
||||
bot.receive_event(mock_tweet("spammer", "@test_ebooks @m1sp 8"))
|
||||
expect(bot.twitter).to_not have_received(:update)
|
||||
end
|
||||
end
|
||||
end
|
||||
|
|
|
@ -19,6 +19,7 @@ Gem::Specification.new do |gem|
|
|||
gem.add_development_dependency 'rspec-mocks'
|
||||
gem.add_development_dependency 'memory_profiler'
|
||||
gem.add_development_dependency 'pry-byebug'
|
||||
gem.add_development_dependency 'timecop'
|
||||
|
||||
gem.add_runtime_dependency 'twitter', '~> 5.0'
|
||||
gem.add_runtime_dependency 'simple_oauth'
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue