2017-04-27 15:42:22 +03:00
|
|
|
# frozen_string_literal: true
|
|
|
|
|
|
|
|
class Sanitize
|
|
|
|
module Config
|
2020-02-08 22:22:38 +02:00
|
|
|
# URL schemes permitted for the `src` attribute of embedded media elements
# (used by the `protocols` section of MASTODON_OEMBED).
HTTP_PROTOCOLS = %w(
  http
  https
).freeze
|
|
|
|
|
|
|
|
# URL schemes permitted in link-like attributes (`a[href]`, `blockquote[cite]`).
# Anchors whose href uses any other scheme are replaced by plain text in
# UNSUPPORTED_HREF_TRANSFORMER.
LINK_PROTOCOLS = %w(
  http
  https
  dat
  dweb
  ipfs
  ipns
  ssb
  gopher
  xmpp
  magnet
  gemini
).freeze
|
2017-04-27 15:42:22 +03:00
|
|
|
|
2017-06-17 21:26:05 +03:00
|
|
|
# Sanitize transformer that filters a node's `class` attribute down to the
# allowed class names.
#
# Nodes without a `class` attribute are left untouched. When every class is
# rejected the attribute is kept but set to an empty string.
#
# @param env [Hash] transformer environment; only `env[:node]` is read
# @return [void]
CLASS_WHITELIST_TRANSFORMER = lambda do |env|
  node = env[:node]
  # Split on tab, LF, FF, CR and space; consecutive separators yield empty
  # tokens, which match none of the patterns below and are therefore dropped.
  class_list = node['class']&.split(/[\t\n\f\r ]/)

  return unless class_list

  # \A / \z anchor on the whole token rather than on line boundaries.
  class_list.keep_if do |e|
    next true if /\A(h|p|u|dt|e)-/.match?(e) # microformats classes
    next true if /\A(mention|hashtag)\z/.match?(e) # semantic classes
    next true if /\A(ellipsis|invisible)\z/.match?(e) # link formatting classes
    next true if /\Aquote-inline\z/.match?(e) # quote inline classes
  end

  node['class'] = class_list.join(' ')
end
|
|
|
|
|
2019-05-26 16:10:33 +03:00
|
|
|
# Sanitize transformer that rewrites an `<img>` node into a text link.
#
# The node is renamed to `a`, its `src` is copied to `href`, and its content
# becomes "[🖼 <alt>]" when an alt text is present, otherwise "[🖼 <url>]" with
# a shortened form of the URL.
#
# @param env [Hash] transformer environment; reads `env[:node_name]` and `env[:node]`
# @return [void]
IMG_TAG_TRANSFORMER = lambda do |env|
  return unless env[:node_name] == 'img'

  node = env[:node]
  node.name = 'a'
  node['href'] = node['src']

  if node['alt'].present?
    node.content = "[🖼 #{node['alt']}]"
  else
    url = node['href']
    # Hide the http(s) scheme and a leading "www." from the visible text.
    prefix = url.match(%r{\Ahttps?://(www\.)?}).to_s
    # Show at most 30 characters after the prefix; mark truncation with "…".
    text = url[prefix.length, 30]
    text += '…' if url.length - prefix.length > 30
    node.content = "[🖼 #{text}]"
  end
end
|
|
|
|
|
2023-06-20 19:10:19 +03:00
|
|
|
# Sanitize transformer that only lets `translate="no"` through: any other
# value of the `translate` attribute is removed from the node.
#
# @param env [Hash] transformer environment; only `env[:node]` is read
# @return [void]
TRANSLATE_TRANSFORMER = lambda do |env|
  node = env[:node]
  node.remove_attribute('translate') unless node['translate'] == 'no'
end
|
|
|
|
|
2020-02-08 22:22:38 +02:00
|
|
|
# Sanitize transformer that replaces an `<a>` node with a plain text node
# (carrying the anchor's text) when its href scheme is not in LINK_PROTOCOLS.
#
# An href that does not match Sanitize::REGEX_PROTOCOL (including a missing
# href) is tagged `:relative`; since LINK_PROTOCOLS holds only strings, such
# anchors are replaced as well.
#
# @param env [Hash] transformer environment; reads `env[:node_name]` and `env[:node]`
# @return [void]
UNSUPPORTED_HREF_TRANSFORMER = lambda do |env|
  return unless env[:node_name] == 'a'

  current_node = env[:node]

  scheme = if current_node['href'] =~ Sanitize::REGEX_PROTOCOL
             # Lower-case the captured scheme before comparing it with LINK_PROTOCOLS.
             Regexp.last_match(1).downcase
           else
             :relative
           end

  current_node.replace(Nokogiri::XML::Text.new(current_node.text, current_node.document)) unless LINK_PROTOCOLS.include?(scheme)
end
|
|
|
|
|
2023-11-07 11:11:50 +02:00
|
|
|
# Sanitize configuration for rich-text status HTML: a fixed set of text-level
# and block-level elements, a small attribute allowlist per element, link
# schemes restricted to LINK_PROTOCOLS, and the transformers defined above.
# Every `<a>` additionally gets `rel="nofollow noopener noreferrer"` and
# `target="_blank"` via `add_attributes`.
MASTODON_STRICT = freeze_config(
  elements: %w(p br span a abbr del pre blockquote code b strong u sub sup i em h1 h2 h3 h4 h5 ul ol li),

  attributes: {
    'a' => %w(href rel class title translate),
    'abbr' => %w(title),
    'span' => %w(class translate),
    'blockquote' => %w(cite),
    'ol' => %w(start reversed),
    'li' => %w(value),
  },

  add_attributes: {
    'a' => {
      'rel' => 'nofollow noopener noreferrer',
      'target' => '_blank',
    },
  },

  protocols: {
    'a' => { 'href' => LINK_PROTOCOLS },
    'blockquote' => { 'cite' => LINK_PROTOCOLS },
  },

  transformers: [
    CLASS_WHITELIST_TRANSFORMER,
    IMG_TAG_TRANSFORMER,
    TRANSLATE_TRANSFORMER,
    UNSUPPORTED_HREF_TRANSFORMER,
  ]
)
|
|
|
|
|
2023-11-07 11:11:50 +02:00
|
|
|
# Sanitize configuration for embedded media markup: only media/embed
# elements are allowed, `src` URLs are limited to HTTP_PROTOCOLS, and every
# `<iframe>` is given a fixed `sandbox` attribute.
MASTODON_OEMBED = freeze_config(
  elements: %w(audio embed iframe source video),

  attributes: {
    'audio' => %w(controls),
    'embed' => %w(height src type width),
    'iframe' => %w(allowfullscreen frameborder height scrolling src width),
    'source' => %w(src type),
    'video' => %w(controls height loop width),
  },

  protocols: {
    'embed' => { 'src' => HTTP_PROTOCOLS },
    'iframe' => { 'src' => HTTP_PROTOCOLS },
    'source' => { 'src' => HTTP_PROTOCOLS },
  },

  add_attributes: {
    'iframe' => { 'sandbox' => 'allow-scripts allow-same-origin allow-popups allow-popups-to-escape-sandbox allow-forms' },
  }
)
|
2022-03-28 21:51:51 +03:00
|
|
|
|
|
|
|
# Sanitize transformer that normalises the `rel` attribute of `<a href>` nodes.
#
# Of the existing rel tokens only `tag` is preserved. Links for which
# `TagManager.instance.local_url?` is false additionally get
# `nofollow noopener noreferrer`. When no token remains the attribute is removed.
#
# @param env [Hash] transformer environment; reads `env[:node_name]` and `env[:node]`
# @return [void]
LINK_REL_TRANSFORMER = lambda do |env|
  return unless env[:node_name] == 'a' && env[:node]['href']

  node = env[:node]

  # Intersect with ['tag'] so every other author-supplied rel token is discarded.
  rel = (node['rel'] || '').split & ['tag']
  rel += %w(nofollow noopener noreferrer) unless TagManager.instance.local_url?(node['href'])

  if rel.empty?
    node.remove_attribute('rel')
  else
    node['rel'] = rel.join(' ')
  end
end
|
|
|
|
|
|
|
|
# Sanitize transformer that normalises the `target` attribute of `<a href>` nodes.
#
# A link for which `TagManager.instance.local_url?` is true and whose target
# is not already `_blank` loses its `target` attribute; every other link is
# forced to `target="_blank"`.
#
# @param env [Hash] transformer environment; reads `env[:node_name]` and `env[:node]`
# @return [void]
LINK_TARGET_TRANSFORMER = lambda do |env|
  return unless env[:node_name] == 'a' && env[:node]['href']

  node = env[:node]
  if node['target'] != '_blank' && TagManager.instance.local_url?(node['href'])
    node.remove_attribute('target')
  else
    node['target'] = '_blank'
  end
end
|
|
|
|
|
2023-12-18 00:04:16 +02:00
|
|
|
# Variant of MASTODON_STRICT in which link attributes are computed per link
# instead of being added unconditionally: `target` is allowed on `<a>`,
# `add_attributes` is emptied, and LINK_REL_TRANSFORMER /
# LINK_TARGET_TRANSFORMER run after the MASTODON_STRICT transformers.
MASTODON_OUTGOING = freeze_config MASTODON_STRICT.merge(
  attributes: merge(
    MASTODON_STRICT[:attributes],
    'a' => %w(href rel class title target translate)
  ),

  add_attributes: {},

  transformers: [
    CLASS_WHITELIST_TRANSFORMER,
    IMG_TAG_TRANSFORMER,
    TRANSLATE_TRANSFORMER,
    UNSUPPORTED_HREF_TRANSFORMER,
    LINK_REL_TRANSFORMER,
    LINK_TARGET_TRANSFORMER,
  ]
)
|
2017-04-27 15:42:22 +03:00
|
|
|
end
|
|
|
|
end
|