Fix #54 - Fetch remote accounts by URL from mentions
Atom fetching has been extracted from FetchRemoteAccountService and FetchRemoteStatusService into FetchAtomService. Mentions of the constant "http://activityschema.org/collection/public" are skipped, as it is not a real URL/user.
This commit is contained in:
parent
0bd4608ad1
commit
c6b0311b86
11 changed files with 99 additions and 67 deletions
46
app/services/fetch_atom_service.rb
Normal file
46
app/services/fetch_atom_service.rb
Normal file
|
@ -0,0 +1,46 @@
|
|||
# Locates and downloads the Atom feed that corresponds to a URL.
#
# The URL is probed with a HEAD request first. Depending on the answer, the
# feed is taken from the URL itself, from an alternate link advertised in the
# `Link` response header, or from a `<link rel="alternate">` element found in
# the HTML document served at the URL.
class FetchAtomService < BaseService
  # MIME type that identifies an Atom document or an Atom alternate link.
  ATOM_MIME_TYPE = 'application/atom+xml'.freeze

  # Resolves +url+ to an Atom feed.
  #
  # @param url [String] address of the remote resource to inspect
  # @return [Array(String, String), nil] the feed URL followed by the feed
  #   body, or nil when the HEAD request does not answer 200 or when no Atom
  #   alternate could be discovered
  def call(url)
    response = http_client.head(url)

    Rails.logger.debug "Remote status HEAD request returned code #{response.code}"
    return nil unless response.code == 200

    # The URL already points at an Atom document.
    return [url, fetch(url)] if response.mime_type == ATOM_MIME_TYPE

    # A Link header that exists but names no Atom alternate (it may only carry
    # unrelated relations) must not end discovery: fall back to the HTML body.
    from_headers = process_headers(response) if response['Link'].present?
    from_headers || process_html(fetch(url))
  end

  private

  # Searches an HTML document for a `<link rel="alternate">` element of the
  # Atom type and downloads the feed it points to.
  #
  # @param body [String] HTML source
  # @return [Array(String, String), nil] feed URL and feed body, or nil when
  #   the document has no such element or the element lacks an href
  def process_html(body)
    Rails.logger.debug "Processing HTML"

    page = Nokogiri::HTML(body)
    alternate_link = page.xpath('//link[@rel="alternate"]').find { |link| link['type'] == ATOM_MIME_TYPE }

    # Without an href there is nothing to download.
    href = alternate_link && alternate_link['href']
    return nil if href.blank?

    [href, fetch(href)]
  end

  # Searches the `Link` response header for an Atom alternate and downloads
  # the feed it points to.
  #
  # @param response [#[]] response whose 'Link' header is inspected
  # @return [Array(String, String), nil] feed URL and feed body, or nil when
  #   the header advertises no Atom alternate
  def process_headers(response)
    Rails.logger.debug "Processing link header"

    # NOTE(review): the header lookup may yield an Array when the server sends
    # the Link header more than once; the values are folded into a single
    # comma-separated list before parsing - confirm against the HTTP client.
    link_header = LinkHeader.parse(Array(response['Link']).join(', '))
    alternate_link = link_header.find_link(%w[rel alternate], ['type', ATOM_MIME_TYPE])
    return nil if alternate_link.nil?

    [alternate_link.href, fetch(alternate_link.href)]
  end

  # Downloads +url+ with a GET request.
  #
  # @param url [String] address to download
  # @return [String] the response converted with #to_s
  def fetch(url)
    http_client.get(url).to_s
  end

  # Builds the HTTP client used for every request of this service, with
  # per-operation timeouts (write: 20, connect: 20, read: 50).
  def http_client
    HTTP.timeout(:per_operation, write: 20, connect: 20, read: 50)
  end
end
|
Loading…
Add table
Add a link
Reference in a new issue