X-Git-Url: https://git.openstreetmap.org./rails.git/blobdiff_plain/9a9b045372a6f48420a9a6dacfde52c34ab7abce..03408b6294e0aa56d46823c1f44d47aaf69e226b:/lib/rich_text.rb?ds=inline

diff --git a/lib/rich_text.rb b/lib/rich_text.rb
index 7325a2a28..db296967b 100644
--- a/lib/rich_text.rb
+++ b/lib/rich_text.rb
@@ -1,4 +1,8 @@
 module RichText
+  SPAMMY_PHRASES = [
+    "Business Description:", "Additional Keywords:"
+  ].freeze
+
   def self.new(format, text)
     case format
     when "html" then HTML.new(text || "")
@@ -25,18 +29,24 @@ module RichText
 
       doc = Nokogiri::HTML(to_html)
 
-      if doc.content.length > 0
+      if doc.content.empty?
+        link_proportion = 0
+      else
         doc.xpath("//a").each do |link|
           link_count += 1
           link_size += link.content.length
         end
 
         link_proportion = link_size.to_f / doc.content.length.to_f
-      else
-        link_proportion = 0
       end
 
-      [link_proportion - 0.2, 0.0].max * 200 + link_count * 40
+      spammy_phrases = SPAMMY_PHRASES.count do |phrase|
+        doc.content.include?(phrase)
+      end
+
+      [link_proportion - 0.2, 0.0].max * 200 +
+        link_count * 40 +
+        spammy_phrases * 40
     end
 
     protected
@@ -80,26 +90,12 @@ module RichText
     end
 
     def self.html_renderer
-      @html_renderer ||= Renderer.new(:filter_html => true, :safe_links_only => true)
+      @html_renderer ||= Redcarpet::Render::XHTML.new(:filter_html => true, :safe_links_only => true, :link_attributes => { :rel => "nofollow" })
     end
 
     def self.html_parser
       @html_parser ||= Redcarpet::Markdown.new(html_renderer, :no_intra_emphasis => true, :autolink => true, :space_after_headers => true)
     end
-
-    class Renderer < Redcarpet::Render::XHTML
-      def link(link, _title, alt_text)
-        "#{alt_text}"
-      end
-
-      def autolink(link, link_type)
-        if link_type == :email
-          "#{link}"
-        else
-          "#{link}"
-        end
-      end
-    end
   end
 
   class Text < Base