# Extracted from a code-viewer page whose header read: Ruby, 47 lines, 1.2 KiB.
# Locates and downloads the Atom feed advertised for a URL.
#
# Discovery order, after an initial HEAD request:
#   1. the URL itself, when it is served as application/atom+xml;
#   2. an Atom alternate advertised in the HTTP Link header;
#   3. an Atom alternate advertised by a <link rel="alternate"> element in
#      the document body.
class FetchAtomService < BaseService
  ATOM_MIME_TYPE = 'application/atom+xml'

  # @param url [String] address to probe for an Atom feed
  # @return [Array(String, String), nil] the feed URL paired with the body
  #   downloaded from it, or nil when the HEAD request does not return 200
  #   or no Atom feed is advertised
  def call(url)
    response = http_client.head(url)

    Rails.logger.debug "Remote status HEAD request returned code #{response.code}"
    return nil if response.code != 200

    return [url, fetch(url)] if response.mime_type == ATOM_MIME_TYPE

    # A Link header that lacks an Atom alternate must not end discovery:
    # the document itself may still advertise the feed.
    process_headers(response) || process_html(fetch(url))
  end

  private

  # Searches a document body for an Atom alternate link and downloads it.
  #
  # @param body [String] document body to parse as HTML
  # @return [Array(String, String), nil] feed URL and feed body, or nil when
  #   no usable Atom alternate link is present
  def process_html(body)
    Rails.logger.debug 'Processing HTML'

    page = Nokogiri::HTML(body)
    alternate_link = page.xpath('//link[@rel="alternate"]').find do |link|
      # A link without an href gives us nothing to fetch, so skip it.
      link['type'] == ATOM_MIME_TYPE && link['href'].present?
    end
    return nil if alternate_link.nil?

    [alternate_link['href'], fetch(alternate_link['href'])]
  end

  # Searches the Link response header for an Atom alternate and downloads it.
  #
  # @param response [#[]] response whose 'Link' header is inspected
  # @return [Array(String, String), nil] feed URL and feed body, or nil when
  #   the header is missing or carries no Atom alternate
  def process_headers(response)
    # A repeated header may be exposed as an Array of values; join them into
    # the equivalent single comma-separated header before parsing.
    raw_header = Array(response['Link']).join(', ')
    return nil if raw_header.blank?

    Rails.logger.debug 'Processing link header'

    link_header = LinkHeader.parse(raw_header)
    alternate_link = link_header.find_link(%w[rel alternate], ['type', ATOM_MIME_TYPE])
    return nil if alternate_link.nil?

    [alternate_link.href, fetch(alternate_link.href)]
  end

  # Downloads a URL with GET and returns the response body as a String.
  # The response status is not inspected here.
  def fetch(url)
    http_client.get(url).to_s
  end

  # Builds an HTTP client with per-operation timeouts
  # (presumably expressed in seconds -- confirm against the HTTP library).
  def http_client
    HTTP.timeout(:per_operation, write: 20, connect: 20, read: 50)
  end
end
|