]> git.openstreetmap.org Git - rails.git/blobdiff - lib/rich_text.rb
Use reports_count so that counter_cache works automatically.
[rails.git] / lib / rich_text.rb
index ec5e9e473789a9d70c7e8fb770cac51e14be8137..db296967ba3aa13d43371a67ba2dec87505cf8a2 100644 (file)
@@ -1,28 +1,58 @@
 module RichText
+  SPAMMY_PHRASES = [
+    "Business Description:", "Additional Keywords:"
+  ].freeze
+
   def self.new(format, text)
     case format
-    when "html"; HTML.new(text || "")
-    when "markdown"; Markdown.new(text || "")
-    else; nil
+    when "html" then HTML.new(text || "")
+    when "markdown" then Markdown.new(text || "")
+    when "text" then Text.new(text || "")
     end
   end
 
-  class HTML < String
+  class SimpleFormat
     include ActionView::Helpers::TextHelper
-    include ActionView::Helpers::TagHelper
+    include ActionView::Helpers::OutputSafetyHelper
 
-    def to_html
-      linkify(sanitize(simple_format(self)))
+    def sanitize(text)
+      Sanitize.clean(text, Sanitize::Config::OSM).html_safe
     end
+  end
 
-    def to_text
-      self
+  class Base < String
+    include ActionView::Helpers::TagHelper
+
+    def spam_score
+      link_count = 0
+      link_size = 0
+
+      doc = Nokogiri::HTML(to_html)
+
+      if doc.content.empty?
+        link_proportion = 0
+      else
+        doc.xpath("//a").each do |link|
+          link_count += 1
+          link_size += link.content.length
+        end
+
+        link_proportion = link_size.to_f / doc.content.length.to_f
+      end
+
+      spammy_phrases = SPAMMY_PHRASES.count do |phrase|
+        doc.content.include?(phrase)
+      end
+
+      [link_proportion - 0.2, 0.0].max * 200 +
+        link_count * 40 +
+        spammy_phrases * 40
     end
 
-  private
+    protected
 
-    def sanitize(text)
-      Sanitize.clean(text, Sanitize::Config::OSM).html_safe
+    def simple_format(text)
+      SimpleFormat.new.simple_format(text)
     end
 
     def linkify(text)
@@ -34,24 +64,47 @@ module RichText
     end
   end
 
-  class Markdown < String
+  class HTML < Base
     def to_html
-      html_parser.render(self).html_safe
+      linkify(sanitize(simple_format(self)))
     end
 
     def to_text
-      self
+      to_s
     end
 
-  private
+    private
 
-    def html_parser
-      @@html_renderer ||= Redcarpet::Render::XHTML.new({
-        :filter_html => true, :safe_links_only => true
-      })
-      @@html_parser ||= Redcarpet::Markdown.new(@@html_renderer, {
-        :no_intra_emphasis => true, :autolink => true, :space_after_headers => true
-      })
+    def sanitize(text)
+      Sanitize.clean(text, Sanitize::Config::OSM).html_safe
+    end
+  end
+
+  class Markdown < Base
+    def to_html
+      Markdown.html_parser.render(self).html_safe
+    end
+
+    def to_text
+      to_s
+    end
+
+    def self.html_renderer
+      @html_renderer ||= Redcarpet::Render::XHTML.new(:filter_html => true, :safe_links_only => true, :link_attributes => { :rel => "nofollow" })
+    end
+
+    def self.html_parser
+      @html_parser ||= Redcarpet::Markdown.new(html_renderer, :no_intra_emphasis => true, :autolink => true, :space_after_headers => true)
+    end
+  end
+
+  class Text < Base
+    def to_html
+      linkify(simple_format(ERB::Util.html_escape(self)))
+    end
+
+    def to_text
+      to_s
     end
   end
 end