openstreetmap-website/lib/rich_text.rb

184 lines
3.9 KiB
Ruby

module RichText
SPAMMY_PHRASES = [
"Business Description:", "Additional Keywords:"
].freeze
MAX_DESCRIPTION_LENGTH = 500
def self.new(format, text)
case format
when "html" then HTML.new(text || "")
when "markdown" then Markdown.new(text || "")
when "text" then Text.new(text || "")
end
end
class SimpleFormat
include ActionView::Helpers::TextHelper
include ActionView::Helpers::OutputSafetyHelper
def sanitize(text, _options = {})
Sanitize.clean(text, Sanitize::Config::OSM).html_safe
end
end
class Base < String
include ActionView::Helpers::TagHelper
def spam_score
link_count = 0
link_size = 0
doc = Nokogiri::HTML(to_html)
if doc.content.empty?
link_proportion = 0
else
doc.xpath("//a").each do |link|
link_count += 1
link_size += link.content.length
end
link_proportion = link_size.to_f / doc.content.length
end
spammy_phrases = SPAMMY_PHRASES.count do |phrase|
doc.content.include?(phrase)
end
([link_proportion - 0.2, 0.0].max * 200) +
(link_count * 40) +
(spammy_phrases * 40)
end
def image
nil
end
def image_alt
nil
end
def description
nil
end
protected
def simple_format(text)
SimpleFormat.new.simple_format(text)
end
def sanitize(text)
Sanitize.clean(text, Sanitize::Config::OSM).html_safe
end
def linkify(text, mode = :urls)
if text.html_safe?
Rinku.auto_link(text, mode, tag_builder.tag_options(:rel => "nofollow noopener noreferrer")).html_safe
else
Rinku.auto_link(text, mode, tag_builder.tag_options(:rel => "nofollow noopener noreferrer"))
end
end
end
class HTML < Base
def to_html
linkify(sanitize(simple_format(self)))
end
def to_text
to_s
end
end
class Markdown < Base
def to_html
linkify(sanitize(document.to_html), :all)
end
def to_text
to_s
end
def image
@image_element = first_image_element(document.root) unless defined? @image_element
@image_element.attr["src"] if @image_element
end
def image_alt
@image_element = first_image_element(document.root) unless defined? @image_element
@image_element.attr["alt"] if @image_element
end
def description
return @description if defined? @description
@description = first_truncated_text_content(document.root)
end
private
def document
@document ||= Kramdown::Document.new(self)
end
def first_image_element(element)
return element if image?(element) && element.attr["src"].present?
element.children.find do |child|
nested_image = first_image_element(child)
break nested_image if nested_image
end
end
def first_truncated_text_content(element)
if paragraph?(element)
truncated_text_content(element)
else
element.children.find do |child|
text = first_truncated_text_content(child)
break text unless text.nil?
end
end
end
def truncated_text_content(element)
text = ""
append_text = lambda do |child|
if child.type == :text
text << child.value
else
child.children.each do |c|
append_text.call(c)
break if text.length > MAX_DESCRIPTION_LENGTH
end
end
end
append_text.call(element)
return nil if text.blank?
text.truncate(MAX_DESCRIPTION_LENGTH)
end
def image?(element)
element.type == :img || (element.type == :html_element && element.value == "img")
end
def paragraph?(element)
element.type == :p || (element.type == :html_element && element.value == "p")
end
end
class Text < Base
def to_html
linkify(simple_format(ERB::Util.html_escape(self)))
end
def to_text
to_s
end
end
end