You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
46 lines
1.3 KiB
46 lines
1.3 KiB
class FetchAtomService < BaseService |
|
def call(url) |
|
response = http_client.head(url) |
|
|
|
Rails.logger.debug "Remote status HEAD request returned code #{response.code}" |
|
return nil if response.code != 200 |
|
|
|
if response.mime_type == 'application/atom+xml' |
|
return [url, fetch(url)] |
|
elsif !response['Link'].blank? |
|
return process_headers(url, response) |
|
else |
|
return process_html(fetch(url)) |
|
end |
|
end |
|
|
|
private |
|
|
|
def process_html(body) |
|
Rails.logger.debug 'Processing HTML' |
|
|
|
page = Nokogiri::HTML(body) |
|
alternate_link = page.xpath('//link[@rel="alternate"]').find { |link| link['type'] == 'application/atom+xml' } |
|
|
|
return nil if alternate_link.nil? |
|
return [alternate_link['href'], fetch(alternate_link['href'])] |
|
end |
|
|
|
def process_headers(url, response) |
|
Rails.logger.debug 'Processing link header' |
|
|
|
link_header = LinkHeader.parse(response['Link'].is_a?(Array) ? response['Link'].first : response['Link']) |
|
alternate_link = link_header.find_link(['rel', 'alternate'], ['type', 'application/atom+xml']) |
|
|
|
return process_html(fetch(url)) if alternate_link.nil? |
|
return [alternate_link.href, fetch(alternate_link.href)] |
|
end |
|
|
|
def fetch(url) |
|
http_client.get(url).to_s |
|
end |
|
|
|
def http_client |
|
HTTP.timeout(:per_operation, write: 20, connect: 20, read: 50).follow |
|
end |
|
end
|
|
|