# donphan/app/services/process_feed_service.rb
class ProcessFeedService < BaseService
# XML namespace URIs bound to the `activity:` and `thr:` prefixes in this class's XPath queries
ACTIVITY_NS = 'http://activitystrea.ms/spec/1.0/'.freeze
THREAD_NS = 'http://purl.org/syndication/thread/1.0'.freeze
# Create local statuses from an Atom feed.
#
# When the document root is a <feed>, its <author> element is first handed to
# UpdateRemoteProfileService. Entries are then processed in reverse document
# order and entries that produced nothing are dropped.
#
# @param [String] body Atom feed
# @param [Account] account Account this feed belongs to
# @return [Enumerable] created statuses
def call(body, account)
  xml = Nokogiri::XML(body)

  unless xml.at_xpath('/xmlns:feed').nil?
    update_remote_profile_service.call(xml.at_xpath('/xmlns:feed/xmlns:author'), account)
  end

  xml.xpath('//xmlns:entry').reverse_each.map { |entry| process_entry(account, entry) }.compact
end
private
# Turn one Atom <entry> into a local Status, or delete the status it refers to.
#
# Only entries whose object type is note, comment or activity are handled.
# An entry whose URI is already stored is ignored unless its verb is
# "delete", in which case the stored status is removed.
#
# @param [Account] account account used as the author of the new status
# @param [Nokogiri::XML::Node] entry the <entry> element
# @return [Status, nil] the saved status, or nil when nothing was created
def process_entry(account, entry)
  return unless [:note, :comment, :activity].include? object_type(entry)

  status = Status.find_by(uri: activity_id(entry))

  # If we already have a post and the verb is now "delete", we gotta delete it and move on!
  if !status.nil? && verb(entry) == :delete
    delete_post!(status)
    return
  end

  return unless status.nil?

  status = Status.new(uri: activity_id(entry), url: activity_link(entry), account: account, text: content(entry), created_at: published(entry), updated_at: updated(entry))

  case verb(entry)
  when :share
    add_reblog!(entry, status)
  when :post
    if thread_id(entry).nil?
      add_post!(entry, status)
    else
      add_reply!(entry, status)
    end
  else
    return
  end

  # add_reblog! leaves the status unsaved when the reblogged status could not
  # be resolved; in that case there is nothing more to record.
  return if status.new_record?

  # Go through accounts the status mentions and create respective relations.
  # Also record all media attachments for the status and for the reblogged status if present.
  record_remote_mentions(status, entry.xpath('./xmlns:link[@rel="mentioned"]'))
  record_remote_mentions(status.reblog, entry.at_xpath('./activity:object', activity: ACTIVITY_NS).xpath('./xmlns:link[@rel="mentioned"]')) if status.reblog?

  process_attachments(entry, status)
  process_attachments(entry.xpath('./activity:object', activity: ACTIVITY_NS), status.reblog) if status.reblog?

  DistributionWorker.perform_async(status.id)
  status
end
# Create Mention records for every account referenced by the given
# <link rel="mentioned"> elements. Does nothing for local statuses.
#
# @param [Status] status status the mentions belong to
# @param [Enumerable] links link elements carrying an href attribute
def record_remote_mentions(status, links)
  return if status.local?

  # Here we have to do a reverse lookup of local accounts by their URL!
  # It's not pretty at all! I really wish all these protocols stuck to
  # using acct:username@domain only! It would make things so much easier
  # and tidier

  links.each do |mention_link|
    # A link without an href cannot be resolved to an account; skip it
    # instead of failing on nil (process_attachments applies the same guard).
    href_attribute = mention_link.attribute('href')
    next if href_attribute.nil?

    href_val = href_attribute.value

    next if href_val == 'http://activityschema.org/collection/public'

    href = Addressable::URI.parse(href_val)

    if TagManager.instance.local_domain?(href.host)
      # A local user is mentioned
      mentioned_account = Account.find_local(href.path.gsub('/users/', ''))

      unless mentioned_account.nil?
        mentioned_account.mentions.where(status: status).first_or_create(status: status)
        NotificationMailer.mention(mentioned_account, status).deliver_later unless mentioned_account.blocking?(status.account)
      end
    else
      # What to do about remote user?
      # This is kinda dodgy because URLs could change, we don't index them
      mentioned_account = Account.find_by(url: href.to_s)
      mentioned_account = FetchRemoteAccountService.new.call(href) if mentioned_account.nil?

      unless mentioned_account.nil?
        mentioned_account.mentions.where(status: status).first_or_create(status: status)
      end
    end
  end
end
# Record a MediaAttachment for every <link rel="enclosure"> under entry that
# is not yet stored for the status. Does nothing for local statuses.
#
# @param [#xpath] entry node (or node set) to search for enclosure links
# @param [Status] status status the attachments belong to
def process_attachments(entry, status)
  return if status.local?

  entry.xpath('./xmlns:link[@rel="enclosure"]').each do |enclosure_link|
    href_attribute = enclosure_link.attribute('href')
    next if href_attribute.nil?

    remote_url = href_attribute.value

    # Skip enclosures already recorded for this status
    next unless MediaAttachment.where(status: status, remote_url: remote_url).first.nil?

    begin
      media = MediaAttachment.new(account: status.account, status: status, remote_url: remote_url)
      media.file_remote_url = remote_url
      media.save
    rescue Paperclip::Errors::NotIdentifiedByImageMagickError
      # An unidentifiable file must not abort the remaining enclosures
      Rails.logger.debug "Error saving attachment from #{remote_url}"
    end
  end
end
# Persist a plain (non-reply, non-reblog) status.
#
# @param [Object] _entry unused; kept so all add_*! helpers share a signature
# @param [Status] status unsaved status to persist
# @return whatever status.save! returns
def add_post!(_entry, status)
  save_result = status.save!
  save_result
end
# Save status as a reblog of the status referenced by the entry's object.
#
# The original is looked up locally first and fetched remotely otherwise.
# If it cannot be resolved, status is left unsaved. The author of a local
# original is notified by mail unless they block the reblogging account.
#
# @param [Nokogiri::XML::Node] entry the <entry> element
# @param [Status] status unsaved status representing the reblog
def add_reblog!(entry, status)
  status.reblog = find_original_status(entry, target_id(entry))
  status.reblog = fetch_remote_status(entry) if status.reblog.nil?

  return if status.reblog.nil?

  status.save!

  if status.reblog.local? && !status.reblog.account.blocking?(status.account)
    NotificationMailer.reblog(status.reblog, status.account).deliver_later
  end
end
# Save status as a reply to the status named by the entry's in-reply-to ref.
#
# If the parent is not known yet but the entry carries an href for it, a
# ThreadResolveWorker job is enqueued for the saved status.
#
# @param [Nokogiri::XML::Node] entry the <entry> element
# @param [Status] status unsaved status representing the reply
def add_reply!(entry, status)
  status.thread = find_original_status(entry, thread_id(entry))
  status.save!

  if status.thread.nil? && !thread_href(entry).nil?
    ThreadResolveWorker.perform_async(status.id, thread_href(entry))
  end
end
# Remove a stored status by delegating to RemoveStatusService.
#
# @param [Status] status status to remove
def delete_post!(status)
  remove_status_service.call(status)
end
# Look up an already stored status by its Atom id.
#
# Ids recognised by TagManager as local are mapped to a primary key; any
# other id is matched against the stored uri. Both branches return nil when
# nothing is found: callers test the result with nil?, so a local status
# that has since been deleted must not raise ActiveRecord::RecordNotFound.
#
# @param [Object] _xml unused
# @param [String, nil] id Atom id of the status
# @return [Status, nil]
def find_original_status(_xml, id)
  return nil if id.nil?

  if TagManager.instance.local_id?(id)
    Status.find_by(id: TagManager.instance.unique_tag_to_local_id(id, 'Status'))
  else
    Status.find_by(uri: id)
  end
end
# Build and try to save the status embedded as the <activity:object> of a
# share entry, resolving (or following) its author first.
#
# @param [Nokogiri::XML::Node] xml the <entry> element of the share
# @return [Status, nil] the status (possibly unsaved if save failed), or nil
#   when resolving the author raised Goldfinger::Error or HTTP::Error
def fetch_remote_status(xml)
  object = xml.at_xpath('./activity:object', activity: ACTIVITY_NS)
  username = object.at_xpath('./xmlns:author/xmlns:name').content
  url = object.at_xpath('./xmlns:author/xmlns:uri').content
  domain = Addressable::URI.parse(url).host

  account = Account.find_remote(username, domain)
  account = follow_remote_account_service.call("#{username}@#{domain}") if account.nil?

  # NOTE(review): timestamps and thread are read from the enclosing entry
  # (published/updated/thread_id look at direct children of xml), not from
  # the embedded object — confirm this is intended.
  status = Status.new(account: account, uri: target_id(xml), text: target_content(xml), url: target_url(xml), created_at: published(xml), updated_at: updated(xml))
  status.thread = find_original_status(xml, thread_id(xml))

  if status.save && status.thread.nil? && !thread_href(xml).nil?
    ThreadResolveWorker.perform_async(status.id, thread_href(xml))
  end

  status
rescue Goldfinger::Error, HTTP::Error
  nil
end
# Text of the node's direct <published> child.
#
# @param [Nokogiri::XML::Node] xml
# @return [String]
def published(xml)
  published_node = xml.at_xpath('./xmlns:published')
  published_node.content
end
# Text of the node's direct <updated> child.
#
# @param [Nokogiri::XML::Node] xml
# @return [String]
def updated(xml)
  updated_node = xml.at_xpath('./xmlns:updated')
  updated_node.content
end
# Text of the node's direct <content> child, or nil when there is none.
#
# @param [Nokogiri::XML::Node] xml
# @return [String, nil]
def content(xml)
  xml.at_xpath('./xmlns:content').try(:content)
end
# Value of the ref attribute of the node's <thr:in-reply-to> child.
#
# @param [Nokogiri::XML::Node] xml
# @return [String, nil] nil when the element or attribute is missing
#   (any StandardError raised during the lookup is treated as "absent")
def thread_id(xml)
  xml.at_xpath('./thr:in-reply-to', thr: THREAD_NS).attribute('ref').value
rescue StandardError
  nil
end
# Value of the href attribute of the node's <thr:in-reply-to> child.
#
# @param [Nokogiri::XML::Node] xml
# @return [String, nil] nil when the element or attribute is missing
#   (any StandardError raised during the lookup is treated as "absent")
def thread_href(xml)
  xml.at_xpath('./thr:in-reply-to', thr: THREAD_NS).attribute('href').value
rescue StandardError
  nil
end
# Text of the <id> child of the first <activity:object> below the node.
#
# @param [Nokogiri::XML::Node] xml
# @return [String, nil] nil when the object or its id is missing
#   (any StandardError raised during the lookup is treated as "absent")
def target_id(xml)
  xml.at_xpath('.//activity:object', activity: ACTIVITY_NS).at_xpath('./xmlns:id').content
rescue StandardError
  nil
end
# Text of the node's direct <id> child.
#
# @param [Nokogiri::XML::Node] xml
# @return [String]
def activity_id(xml)
  id_node = xml.at_xpath('./xmlns:id')
  id_node.content
end
# href of the node's direct <link rel="alternate"> child.
#
# @param [Nokogiri::XML::Node] xml
# @return [String] the href, or an empty string when the lookup fails
def activity_link(xml)
  alternate_link = xml.at_xpath('./xmlns:link[@rel="alternate"]')
  href_attribute = alternate_link.attribute('href')
  href_attribute.value
rescue StandardError
  ''
end
# Text of the <content> child of the first <activity:object> below the node.
# Unlike target_id this does not rescue: a missing object or content raises.
#
# @param [Nokogiri::XML::Node] xml
# @return [String]
def target_content(xml)
  xml.at_xpath('.//activity:object', activity: ACTIVITY_NS).at_xpath('./xmlns:content').content
end
# href of the <link rel="alternate"> child of the first <activity:object>
# below the node. Does not rescue: a missing object, link or href raises.
#
# @param [Nokogiri::XML::Node] xml
# @return [String]
def target_url(xml)
  xml.at_xpath('.//activity:object', activity: ACTIVITY_NS).at_xpath('./xmlns:link[@rel="alternate"]').attribute('href').value
end
# Object type of the node as a symbol, with the activitystrea.ms and
# ostatus.org schema prefixes stripped from <activity:object-type>.
#
# @param [Nokogiri::XML::Node] xml
# @return [Symbol] :activity when the element is missing or the lookup fails
def object_type(xml)
  type_uri = xml.at_xpath('./activity:object-type', activity: ACTIVITY_NS).content
  type_uri.gsub('http://activitystrea.ms/schema/1.0/', '').gsub('http://ostatus.org/schema/1.0/', '').to_sym
rescue StandardError
  :activity
end
# Verb of the node as a symbol, with the activitystrea.ms and ostatus.org
# schema prefixes stripped from <activity:verb>.
#
# @param [Nokogiri::XML::Node] xml
# @return [Symbol] :post when the element is missing or the lookup fails
def verb(xml)
  verb_uri = xml.at_xpath('./activity:verb', activity: ACTIVITY_NS).content
  verb_uri.gsub('http://activitystrea.ms/schema/1.0/', '').gsub('http://ostatus.org/schema/1.0/', '').to_sym
rescue StandardError
  :post
end
# Memoized FollowRemoteAccountService instance.
#
# @return [FollowRemoteAccountService]
def follow_remote_account_service
  @follow_remote_account_service ||= FollowRemoteAccountService.new
end
# Memoized UpdateRemoteProfileService instance.
#
# @return [UpdateRemoteProfileService]
def update_remote_profile_service
  @update_remote_profile_service = UpdateRemoteProfileService.new unless @update_remote_profile_service
  @update_remote_profile_service
end
# Memoized RemoveStatusService instance.
#
# @return [RemoveStatusService]
def remove_status_service
  @remove_status_service ||= RemoveStatusService.new
end
end