]> git.openstreetmap.org Git - rails.git/blob - lib/rich_text.rb
Remove html-safe/unsafe branches from rich text linkify
[rails.git] / lib / rich_text.rb
1 # frozen_string_literal: true
2
3 module RichText
4   SPAMMY_PHRASES = [
5     "Business Description:", "Additional Keywords:"
6   ].freeze
7
8   MAX_DESCRIPTION_LENGTH = 500
9
10   def self.new(format, text)
11     case format
12     when "html" then HTML.new(text || "")
13     when "markdown" then Markdown.new(text || "")
14     when "text" then Text.new(text || "")
15     end
16   end
17
18   class SimpleFormat
19     include ActionView::Helpers::TextHelper
20     include ActionView::Helpers::OutputSafetyHelper
21
22     def sanitize(text, _options = {})
23       Sanitize.clean(text, Sanitize::Config::OSM).html_safe
24     end
25   end
26
27   class Base < String
28     include ActionView::Helpers::TagHelper
29
30     def spam_score
31       link_count = 0
32       link_size = 0
33
34       doc = Nokogiri::HTML(to_html)
35
36       if doc.content.empty?
37         link_proportion = 0
38       else
39         doc.xpath("//a").each do |link|
40           link_count += 1
41           link_size += link.content.length
42         end
43
44         link_proportion = link_size.to_f / doc.content.length
45       end
46
47       spammy_phrases = SPAMMY_PHRASES.count do |phrase|
48         doc.content.include?(phrase)
49       end
50
51       ([link_proportion - 0.2, 0.0].max * 200) +
52         (link_count * 40) +
53         (spammy_phrases * 40)
54     end
55
56     def image
57       nil
58     end
59
60     def image_alt
61       nil
62     end
63
64     def description
65       nil
66     end
67
68     protected
69
70     def simple_format(text)
71       SimpleFormat.new.simple_format(text, :dir => "auto")
72     end
73
74     def sanitize(text)
75       Sanitize.clean(text, Sanitize::Config::OSM).html_safe
76     end
77
78     def linkify(text, mode = :urls)
79       Rinku.auto_link(ERB::Util.html_escape(text), mode, tag_builder.tag_options(:rel => "nofollow noopener noreferrer")).html_safe
80     end
81   end
82
83   class HTML < Base
84     def to_html
85       linkify(sanitize(simple_format(self)))
86     end
87
88     def to_text
89       to_s
90     end
91   end
92
93   class Markdown < Base
94     def to_html
95       linkify(sanitize(document.to_html), :all)
96     end
97
98     def to_text
99       to_s
100     end
101
102     def image
103       @image_element = first_image_element(document.root) unless defined? @image_element
104       @image_element.attr["src"] if @image_element
105     end
106
107     def image_alt
108       @image_element = first_image_element(document.root) unless defined? @image_element
109       @image_element.attr["alt"] if @image_element
110     end
111
112     def description
113       return @description if defined? @description
114
115       @description = first_truncated_text_content(document.root)
116     end
117
118     private
119
120     def document
121       @document ||= Kramdown::Document.new(self)
122     end
123
124     def first_image_element(element)
125       return element if image?(element) && element.attr["src"].present?
126
127       element.children.find do |child|
128         nested_image = first_image_element(child)
129         break nested_image if nested_image
130       end
131     end
132
133     def first_truncated_text_content(element)
134       if paragraph?(element)
135         truncated_text_content(element)
136       else
137         element.children.find do |child|
138           text = first_truncated_text_content(child)
139           break text unless text.nil?
140         end
141       end
142     end
143
144     def truncated_text_content(element)
145       text = +""
146
147       append_text = lambda do |child|
148         if child.type == :text
149           text << child.value
150         else
151           child.children.each do |c|
152             append_text.call(c)
153             break if text.length > MAX_DESCRIPTION_LENGTH
154           end
155         end
156       end
157       append_text.call(element)
158
159       return nil if text.blank?
160
161       text.truncate(MAX_DESCRIPTION_LENGTH)
162     end
163
164     def image?(element)
165       element.type == :img || (element.type == :html_element && element.value == "img")
166     end
167
168     def paragraph?(element)
169       element.type == :p || (element.type == :html_element && element.value == "p")
170     end
171   end
172
173   class Text < Base
174     def to_html
175       linkify(simple_format(ERB::Util.html_escape(self)))
176     end
177
178     def to_text
179       to_s
180     end
181   end
182 end