require 'xml/libxml'
require 'digest/md5'
require 'RMagick'
+ require 'nokogiri'
# The base class for API Errors.
class APIError < RuntimeError
return "#{prefix}latitude BETWEEN #{minlat} AND #{maxlat} AND #{prefix}longitude BETWEEN #{minlon} AND #{maxlon}"
end
+ # Return a spam score for a chunk of text
+ def self.spam_score(text)
+ link_count = 0
+ link_size = 0
+ doc = Nokogiri::HTML(text)
+
+ if doc.content.length > 0
+ doc.xpath("//a").each do |link|
+ link_count += 1
+ link_size += link.content.length
+ end
+
+ link_proportion = link_size.to_f / doc.content.length.to_f
+ else
+ link_proportion = 0
+ end
+
+ return [link_proportion - 0.2, 0.0].max * 200 + link_count * 20
+ end
end