# frozen_string_literal: true

# Fetches a URL and tries to resolve it to an ActivityPub JSON document.
#
# If the first response is not itself an acceptable document, a single extra
# hop is attempted: to the document's own `id`, to an `alternate` link in the
# `Link` response header, or to an `alternate` `<link>` element of an HTML page.
class FetchResourceService < BaseService
  include JsonLdHelper

  ACCEPT_HEADER = 'application/activity+json, application/ld+json; profile="https://www.w3.org/ns/activitystreams", text/html;q=0.1'
  ACTIVITY_STREAM_LINK_TYPES = ['application/activity+json', 'application/ld+json; profile="https://www.w3.org/ns/activitystreams"'].freeze

  # Status code of the most recently processed HTTP response (nil until a
  # response has been processed).
  attr_reader :response_code

  # @param url [String] the address to fetch
  # @return [Array, nil] `[resolved_url, { prefetched_body: body }]` on
  #   success; nil when the URL is blank, nothing suitable was found, or one of
  #   the rescued network/validation errors occurred (logged at debug level).
  def call(url)
    process(url)
  rescue HTTP::Error, OpenSSL::SSL::SSLError, Addressable::URI::InvalidURIError, Mastodon::HostValidationError, Mastodon::LengthValidationError => e
    Rails.logger.debug { "Error fetching resource #{@url}: #{e}" }
    nil
  end

  private

  # Requests +url+ and hands the response to #process_response.
  #
  # @param url [String, nil] address to fetch
  # @param terminal [Boolean] when true, the response is not allowed to
  #   trigger another hop
  def process(url, terminal: false)
    # Besides the caller-supplied URL, this method is re-entered with values
    # taken from remote data (`id`, `href`), which may be absent. Guarding here
    # keeps a missing value from being turned into a request.
    return if url.blank?

    @url = url

    perform_request { |response| process_response(response, terminal) }
  end

  # Builds the GET request for @url and performs it, yielding the response to
  # the given block.
  def perform_request(&block)
    Request.new(:get, @url).tap do |request|
      request.add_headers('Accept' => ACCEPT_HEADER)

      # In a real setting we want to sign all outgoing requests,
      # in case the remote server has secure mode enabled and requires
      # authentication on all resources. However, during development,
      # sending request signatures with an inaccessible host is useless
      # and prevents even public resources from being fetched, so
      # don't do it
      request.on_behalf_of(Account.representative) unless Rails.env.development?
    end.perform(&block)
  end

  # Records the status code and, for a 200 response, either accepts the body as
  # the result or (unless +terminal+) follows one alternate link.
  #
  # @return [Array, nil] see #call
  def process_response(response, terminal = false)
    @response_code = response.code
    return unless response.code == 200

    if valid_activitypub_content_type?(response)
      body = response.body_with_limit
      json = body_to_json(body)

      return unless supported_context?(json) && (equals_or_includes_any?(json['type'], ActivityPub::FetchRemoteActorService::SUPPORTED_TYPES) || expected_type?(json))

      # The document is accepted only when its `id` is the URL it was fetched from.
      return [@url, { prefetched_body: body }] if json['id'] == @url

      # Otherwise re-fetch from the declared `id`, but only once.
      return if terminal

      process(json['id'], terminal: true)
    elsif !terminal
      link_header = response['Link'] && parse_link_header(response)

      if link_header&.find_link(%w(rel alternate))
        process_link_headers(link_header)
      elsif response.mime_type == 'text/html'
        process_html(response)
      end
    end
  end

  # Whether the document's `type` is one of the object types listed in
  # ActivityPub::Activity::Create (SUPPORTED_TYPES or CONVERTED_TYPES).
  def expected_type?(json)
    equals_or_includes_any?(json['type'], ActivityPub::Activity::Create::SUPPORTED_TYPES + ActivityPub::Activity::Create::CONVERTED_TYPES)
  end

  # Looks in an HTML page for `<link rel="alternate">` whose `type` is one of
  # ACTIVITY_STREAM_LINK_TYPES and fetches its `href` as the final hop.
  def process_html(response)
    page = Nokogiri::HTML5(response.body_with_limit)
    json_link = page.xpath('//link[@rel="alternate"]').find { |link| ACTIVITY_STREAM_LINK_TYPES.include?(link['type']) }
    return if json_link.nil?

    process(json_link['href'], terminal: true)
  end

  # Fetches, as the final hop, the first `alternate` link from the parsed
  # `Link` header whose type is one of ACTIVITY_STREAM_LINK_TYPES. Types are
  # tried in the constant's order, so `application/activity+json` wins.
  def process_link_headers(link_header)
    ACTIVITY_STREAM_LINK_TYPES.each do |type|
      json_link = link_header.find_link(%w(rel alternate), ['type', type])
      return process(json_link.href, terminal: true) unless json_link.nil?
    end

    nil
  end

  # Parses the `Link` response header; when the header is present several
  # times, only the first occurrence is used.
  def parse_link_header(response)
    LinkHeader.parse(Array(response['Link']).first)
  end
end