X-Git-Url: https://git.openstreetmap.org./rails.git/blobdiff_plain/34e3e51456774127d43408b7ab65c24f41373f62..90918ade9200275cb4382c2b1b3c253914fb8b0e:/lib/rich_text.rb diff --git a/lib/rich_text.rb b/lib/rich_text.rb index 4cd254720..db296967b 100644 --- a/lib/rich_text.rb +++ b/lib/rich_text.rb @@ -1,10 +1,13 @@ module RichText + SPAMMY_PHRASES = [ + "Business Description:", "Additional Keywords:" + ].freeze + def self.new(format, text) case format - when "html"; HTML.new(text || "") - when "markdown"; Markdown.new(text || "") - when "text"; Text.new(text || "") - else; nil + when "html" then HTML.new(text || "") + when "markdown" then Markdown.new(text || "") + when "text" then Text.new(text || "") end end @@ -26,21 +29,27 @@ module RichText doc = Nokogiri::HTML(to_html) - if doc.content.length > 0 + if doc.content.empty? + link_proportion = 0 + else doc.xpath("//a").each do |link| link_count += 1 link_size += link.content.length end link_proportion = link_size.to_f / doc.content.length.to_f - else - link_proportion = 0 end - return [link_proportion - 0.2, 0.0].max * 200 + link_count * 40 + spammy_phrases = SPAMMY_PHRASES.count do |phrase| + doc.content.include?(phrase) + end + + [link_proportion - 0.2, 0.0].max * 200 + + link_count * 40 + + spammy_phrases * 40 end - protected + protected def simple_format(text) SimpleFormat.new.simple_format(text) @@ -61,10 +70,10 @@ module RichText end def to_text - self.to_s + to_s end - private + private def sanitize(text) Sanitize.clean(text, Sanitize::Config::OSM).html_safe @@ -73,36 +82,19 @@ module RichText class Markdown < Base def to_html - html_parser.render(self).html_safe + Markdown.html_parser.render(self).html_safe end def to_text - self.to_s + to_s end - private - - def html_parser - @@html_renderer ||= Renderer.new({ - :filter_html => true, :safe_links_only => true - }) - @@html_parser ||= Redcarpet::Markdown.new(@@html_renderer, { - :no_intra_emphasis => true, :autolink => true, :space_after_headers => true - }) + def self.html_renderer + @html_renderer ||= Redcarpet::Render::XHTML.new(:filter_html => true, :safe_links_only => true, :link_attributes => { :rel => "nofollow" }) end - class Renderer < Redcarpet::Render::XHTML - def link(link, title, alt_text) - "#{alt_text}" - end - - def autolink(link, link_type) - if link_type == :email - "#{link}" - else - "#{link}" - end - end + def self.html_parser + @html_parser ||= Redcarpet::Markdown.new(html_renderer, :no_intra_emphasis => true, :autolink => true, :space_after_headers => true) end end @@ -112,7 +104,7 @@ module RichText end def to_text - self.to_s + to_s end end end