2017-04-27 22:42:22 +10:00
|
|
|
# frozen_string_literal: true
|
|
|
|
|
|
|
|
class Sanitize
|
|
|
|
module Config
|
2020-02-09 07:22:38 +11:00
|
|
|
# URL schemes accepted for the `src` attribute of embedded media
# (`embed`, `iframe` and `source`) in the oEmbed configuration.
HTTP_PROTOCOLS = %w(
  http
  https
).freeze
|
|
|
|
|
|
|
|
# URL schemes a link's `href` may use. UNSUPPORTED_HREF_TRANSFORMER replaces
# any `a` element whose scheme is not in this list with its plain text.
LINK_PROTOCOLS = %w(
  http
  https
  dat
  dweb
  ipfs
  ipns
  ssb
  gopher
  xmpp
  magnet
  gemini
).freeze
|
2017-04-27 22:42:22 +10:00
|
|
|
|
2017-06-18 04:26:05 +10:00
|
|
|
# Transformer that removes every class name that is not explicitly allowed
# from the current node's `class` attribute.
#
# env - transformer environment Hash; only env[:node] is read. The node must
#       support `node['class']` and `node['class'] = value`.
#
# Returns nil without touching the node when it has no `class` attribute.
# Otherwise the attribute is rewritten with the surviving names joined by a
# single space (an empty string when none survive).
CLASS_WHITELIST_TRANSFORMER = lambda do |env|
  node = env[:node]
  # Split on the individual whitespace characters that separate class names.
  # Consecutive separators yield empty tokens, which the filter below drops.
  class_list = node['class']&.split(/[\t\n\f\r ]/)

  return unless class_list

  # \A/\z anchor the whole token; tokens never contain "\n" after the split,
  # so this is equivalent to per-line anchors but cannot be bypassed.
  class_list.keep_if do |e|
    e.match?(/\A(?:h|p|u|dt|e)-/) || # microformats classes
      e.match?(/\A(?:mention|hashtag)\z/) || # semantic classes
      e.match?(/\A(?:ellipsis|invisible)\z/) # link formatting classes
  end

  node['class'] = class_list.join(' ')
end
|
|
|
|
|
2020-02-09 07:22:38 +11:00
|
|
|
# Transformer that turns links with an unsupported scheme into plain text.
#
# env - transformer environment Hash; env[:node_name] and env[:node] are read.
#
# Only `a` elements are considered. The scheme is taken from the first
# capture of Sanitize::REGEX_PROTOCOL applied to the `href` attribute and
# lower-cased. When the pattern does not match (including a missing `href`)
# the link is treated as :relative, which is never part of LINK_PROTOCOLS.
# Links whose scheme is not listed in LINK_PROTOCOLS are replaced by a text
# node carrying the link's text.
UNSUPPORTED_HREF_TRANSFORMER = lambda do |env|
  return unless env[:node_name] == 'a'

  current_node = env[:node]

  # Use a local MatchData instead of the global Regexp.last_match state.
  protocol_match = Sanitize::REGEX_PROTOCOL.match(current_node['href'])
  scheme = protocol_match ? protocol_match[1].downcase : :relative

  return if LINK_PROTOCOLS.include?(scheme)

  current_node.replace(Nokogiri::XML::Text.new(current_node.text, current_node.document))
end
|
|
|
|
|
2019-06-17 05:46:36 +10:00
|
|
|
# Transformer that rewrites headings, block quotes, preformatted text and
# lists into markup built from paragraphs and line breaks.
#
# env - transformer environment Hash; env[:node_name] and env[:node] are read.
#
# Nodes other than h1-h6, blockquote, pre, ul, ol and li are left alone.
# For `li`, every node visited by `traverse` that is named p, ul, ol or li
# gets a `<br>` inserted after it when it has a next sibling, and is then
# replaced by its own children. Every other handled element is renamed to `p`.
UNSUPPORTED_ELEMENTS_TRANSFORMER = lambda do |env|
  return unless %w(h1 h2 h3 h4 h5 h6 blockquote pre ul ol li).include?(env[:node_name])

  current_node = env[:node]

  if env[:node_name] == 'li'
    current_node.traverse do |node|
      next unless %w(p ul ol li).include?(node.name)

      # Insert the break first: it relies on the node's sibling position,
      # which the replacement below would discard.
      node.add_next_sibling('<br>') if node.next_sibling
      node.replace(node.children) unless node.text?
    end
  else
    current_node.name = 'p'
  end
end
|
|
|
|
|
2017-04-27 22:42:22 +10:00
|
|
|
# Strict sanitizer configuration: only paragraphs, line breaks, spans and
# links are listed as elements. `||=` keeps an already-defined value if this
# file is evaluated more than once.
MASTODON_STRICT ||= freeze_config(
  elements: %w(p br span a),

  attributes: {
    'a' => %w(href rel class),
    'span' => %w(class),
  },

  # Attribute values configured for every `a` element.
  add_attributes: {
    'a' => {
      'rel' => 'nofollow noopener noreferrer',
      'target' => '_blank',
    },
  },

  # No per-attribute protocol lists are configured here; link schemes are
  # checked by UNSUPPORTED_HREF_TRANSFORMER against LINK_PROTOCOLS instead.
  protocols: {},

  transformers: [
    CLASS_WHITELIST_TRANSFORMER,
    UNSUPPORTED_ELEMENTS_TRANSFORMER,
    UNSUPPORTED_HREF_TRANSFORMER,
  ]
)
|
|
|
|
|
|
|
|
# Sanitizer configuration for oEmbed HTML: RELAXED extended with the media
# elements audio, embed, iframe, source and video. `||=` keeps an
# already-defined value if this file is evaluated more than once.
MASTODON_OEMBED ||= freeze_config merge(
  RELAXED,
  elements: RELAXED[:elements] + %w(audio embed iframe source video),

  attributes: merge(
    RELAXED[:attributes],
    'audio' => %w(controls),
    'embed' => %w(height src type width),
    'iframe' => %w(allowfullscreen frameborder height scrolling src width),
    'source' => %w(src type),
    'video' => %w(controls height loop width),
    # NOTE(review): :data is presumably Sanitize's marker for allowing
    # arbitrary data-* attributes - confirm against the Sanitize docs.
    'div' => [:data]
  ),

  # Media sources may only be loaded over the schemes in HTTP_PROTOCOLS.
  protocols: merge(
    RELAXED[:protocols],
    'embed' => { 'src' => HTTP_PROTOCOLS },
    'iframe' => { 'src' => HTTP_PROTOCOLS },
    'source' => { 'src' => HTTP_PROTOCOLS }
  )
)
|
|
|
|
end
|
|
|
|
end
|