1 # frozen_string_literal: true
5 "Business Description:", "Additional Keywords:"
8 MAX_DESCRIPTION_LENGTH = 500
10 def self.new(format, text)
12 when "html" then HTML.new(text || "")
13 when "markdown" then Markdown.new(text || "")
14 when "text" then Text.new(text || "")
19 include ActionView::Helpers::TextHelper
20 include ActionView::Helpers::OutputSafetyHelper
22 def sanitize(text, _options = {})
23 Sanitize.clean(text, Sanitize::Config::OSM).html_safe
32 doc = Nokogiri::HTML(to_html)
37 doc.xpath("//a").each do |link|
39 link_size += link.content.length
42 link_proportion = link_size.to_f / doc.content.length
45 spammy_phrases = SPAMMY_PHRASES.count do |phrase|
46 doc.content.include?(phrase)
49 ([link_proportion - 0.2, 0.0].max * 200) +
68 def simple_format(text)
69 SimpleFormat.new.simple_format(text, :dir => "auto")
73 Sanitize.clean(text, Sanitize::Config::OSM).html_safe
76 def linkify(text, mode = :urls)
77 link_attr = 'rel="nofollow noopener noreferrer"'
78 Rinku.auto_link(ERB::Util.html_escape(text), mode, link_attr) do |url|
79 url = shorten_host(url, Settings.linkify_hosts, Settings.linkify_hosts_replacement)
80 shorten_host(url, Settings.linkify_wiki_hosts, Settings.linkify_wiki_hosts_replacement) do |path|
81 path.sub(Regexp.new(Settings.linkify_wiki_optional_path_prefix || ""), "")
88 def shorten_host(url, hosts, hosts_replacement)
89 %r{^(https?://([^/]*))(.*)$}.match(url) do |m|
90 scheme_host, host, path = m.captures
91 if hosts&.include?(host)
92 path = yield(path) if block_given?
94 "#{hosts_replacement}#{path}"
96 "#{scheme_host}#{path}"
105 linkify(simple_format(self))
113 class Markdown < Base
115 linkify(sanitize(document.to_html), :all)
123 @image_element = first_image_element(document.root) unless defined? @image_element
124 @image_element.attr["src"] if @image_element
128 @image_element = first_image_element(document.root) unless defined? @image_element
129 @image_element.attr["alt"] if @image_element
133 return @description if defined? @description
135 @description = first_truncated_text_content(document.root)
141 @document ||= Kramdown::Document.new(self)
144 def first_image_element(element)
145 return element if image?(element) && element.attr["src"].present?
147 element.children.find do |child|
148 nested_image = first_image_element(child)
149 break nested_image if nested_image
153 def first_truncated_text_content(element)
154 if paragraph?(element)
155 truncated_text_content(element)
157 element.children.find do |child|
158 text = first_truncated_text_content(child)
159 break text unless text.nil?
164 def truncated_text_content(element)
167 append_text = lambda do |child|
168 if child.type == :text
171 child.children.each do |c|
173 break if text.length > MAX_DESCRIPTION_LENGTH
177 append_text.call(element)
179 return nil if text.blank?
181 text.truncate(MAX_DESCRIPTION_LENGTH)
185 element.type == :img || (element.type == :html_element && element.value == "img")
188 def paragraph?(element)
189 element.type == :p || (element.type == :html_element && element.value == "p")
195 linkify(simple_format(ERB::Util.html_escape(self)))