|
|
|
@ -4,18 +4,10 @@ class FetchAtomService < BaseService
|
|
|
|
|
def call(url)
|
|
|
|
|
return if url.blank?
|
|
|
|
|
|
|
|
|
|
response = Request.new(:head, url).perform
|
|
|
|
|
@url = url
|
|
|
|
|
|
|
|
|
|
Rails.logger.debug "Remote status HEAD request returned code #{response.code}"
|
|
|
|
|
|
|
|
|
|
response = Request.new(:get, url).perform if response.code == 405
|
|
|
|
|
|
|
|
|
|
Rails.logger.debug "Remote status GET request returned code #{response.code}"
|
|
|
|
|
|
|
|
|
|
return nil if response.code != 200
|
|
|
|
|
return [url, fetch(url)] if response.mime_type == 'application/atom+xml'
|
|
|
|
|
return process_headers(url, response) if response['Link'].present?
|
|
|
|
|
process_html(fetch(url))
|
|
|
|
|
perform_request
|
|
|
|
|
process_response
|
|
|
|
|
rescue OpenSSL::SSL::SSLError => e
|
|
|
|
|
Rails.logger.debug "SSL error: #{e}"
|
|
|
|
|
nil
|
|
|
|
@ -26,27 +18,57 @@ class FetchAtomService < BaseService
|
|
|
|
|
|
|
|
|
|
private
|
|
|
|
|
|
|
|
|
|
def process_html(body)
|
|
|
|
|
Rails.logger.debug 'Processing HTML'
|
|
|
|
|
# Issues a GET request for @url and stores the result in @response.
#
# The Accept header lists every representation that process_response knows
# how to handle. The JSON-LD entry carries the ActivityStreams profile so
# that it matches the profiled media type process_response checks for; a
# bare "application/ld+json" asks for arbitrary JSON-LD instead.
#
# @return [Object] whatever Request#perform returns (also kept in @response)
def perform_request
  accept = [
    'application/activity+json',
    'application/ld+json; profile="https://www.w3.org/ns/activitystreams"',
    'application/atom+xml',
    'text/html',
  ].join(', ')

  @response = Request.new(:get, @url).add_headers('Accept' => accept).perform
end
|
|
|
|
|
|
|
|
|
|
page = Nokogiri::HTML(body)
|
|
|
|
|
alternate_link = page.xpath('//link[@rel="alternate"]').find { |link| link['type'] == 'application/atom+xml' }
|
|
|
|
|
# Interprets @response and returns the discovered resource, if any.
#
# @param terminal [Boolean] when true, do not follow Link headers or HTML
#   <link> tags any further (used after one hop of discovery has been made)
# @return [Array, nil] [@url, body string, :ostatus] for an Atom response,
#   [@url, body string, :activitypub] for an ActivityPub JSON response, the
#   result of process_headers / process_html when discovery continues, or nil
#   when the status is not 200 or nothing usable was found
def process_response(terminal = false)
  return nil unless @response.code == 200

  # NOTE(review): if the HTTP client's mime_type strips parameters, the
  # profiled ld+json entry below can never match -- confirm against the client.
  activitypub_types = [
    'application/activity+json',
    'application/ld+json; profile="https://www.w3.org/ns/activitystreams"',
  ]
  mime_type = @response.mime_type

  if mime_type == 'application/atom+xml'
    [@url, @response.to_s, :ostatus]
  elsif activitypub_types.include?(mime_type)
    [@url, @response.to_s, :activitypub]
  elsif terminal
    # Already followed one alternate link; stop instead of chasing more.
    nil
  elsif @response['Link']
    process_headers
  elsif mime_type == 'text/html'
    process_html
  end
end
|
|
|
|
|
|
|
|
|
|
def process_headers(url, response)
|
|
|
|
|
Rails.logger.debug 'Processing link header'
|
|
|
|
|
# Looks for <link rel="alternate"> tags in the HTML held in @response and
# follows the first usable one.
#
# An ActivityPub JSON alternate is preferred over an Atom alternate. When one
# is found, @url is pointed at its href, the request is repeated, and the new
# response is processed with terminal = true so discovery stops after this hop.
#
# @return [Array, nil] the result of process_response(true), or nil when the
#   page advertises neither kind of alternate
def process_html
  page = Nokogiri::HTML(@response.to_s)
  alternates = page.xpath('//link[@rel="alternate"]')

  activitypub_types = [
    'application/activity+json',
    'application/ld+json; profile="https://www.w3.org/ns/activitystreams"',
  ]
  json_link = alternates.find { |link| activitypub_types.include?(link['type']) }
  atom_link = alternates.find { |link| link['type'] == 'application/atom+xml' }

  target = json_link || atom_link
  return if target.nil?

  @url = target['href']
  perform_request
  process_response(true)
end
|
|
|
|
|
|
|
|
|
|
# Follows an alternate representation advertised in the response's Link header.
#
# Only the first value is parsed when the header is exposed as an Array.
# Lookup order is ActivityPub JSON, then profiled JSON-LD, then Atom. When a
# link is found, @url is pointed at its href, the request is repeated, and the
# new response is processed with terminal = true so discovery stops here.
#
# @return [Array, nil] the result of process_response(true), or nil when the
#   header advertises none of the supported alternates
def process_headers
  raw_header = @response['Link']
  raw_header = raw_header.first if raw_header.is_a?(Array)
  link_header = LinkHeader.parse(raw_header)

  target = link_header.find_link(%w(rel alternate), %w(type application/activity+json)) ||
           link_header.find_link(%w(rel alternate), ['type', 'application/ld+json; profile="https://www.w3.org/ns/activitystreams"']) ||
           link_header.find_link(%w(rel alternate), %w(type application/atom+xml))
  return if target.nil?

  @url = target.href
  perform_request
  process_response(true)
end
|
|
|
|
|
end
|
|
|
|
|