Skip to content
Snippets Groups Projects
process_feed_service.rb 8.84 KiB
Newer Older
Eugen Rochko's avatar
Eugen Rochko committed
class ProcessFeedService < BaseService
Eugen Rochko's avatar
Eugen Rochko committed
  # Entry point of the service. Parses +body+ as XML, marks the document as
  # utf-8, queues an author profile refresh and then processes the feed
  # entries on behalf of +account+.
  # NOTE(review): the closing `end` of this method is not visible in this view.
  def call(body, account)
    xml = Nokogiri::XML(body)
    xml.encoding = 'utf-8'
    update_author(body, account)
    process_entries(xml, account)
Eugen Rochko's avatar
Eugen Rochko committed

  # Queues a RemoteProfileUpdateWorker job with the account id and the raw
  # feed body (after forcing its encoding to UTF-8).
  # NOTE(review): the meaning of the trailing `true` argument is defined by the
  # worker and cannot be determined from this file.
  def update_author(body, account)
    RemoteProfileUpdateWorker.perform_async(account.id, body.force_encoding('UTF-8'), true)
  # Runs ProcessEntry over every `entry` element found anywhere in the
  # document, walking them in reverse document order, and returns the results
  # with nils (skipped or failed entries) removed.
  def process_entries(xml, account)
    xml.xpath('//xmlns:entry', xmlns: TagManager::XMLNS).reverse_each.map { |entry| ProcessEntry.new.call(entry, account) }.compact
  class ProcessEntry
    # Handles a single feed entry. Stores the entry and account on the
    # instance, returns nil for unsupported verb/type combinations, creates a
    # status for :post and :share verbs and deletes one for :delete.
    # An ActiveRecord::RecordInvalid raised along the way is logged at debug
    # level and turned into a nil result.
    # NOTE(review): the `end` lines closing the `case` and the method are not
    # visible in this view.
    def call(xml, account)
      @account = account
      @xml     = xml
      return if skip_unsupported_type?
      case verb
      when :post, :share
        return create_status
      when :delete
        return delete_status
    rescue ActiveRecord::RecordInvalid => e
      Rails.logger.debug "Nothing was saved for #{id} because: #{e}"
      nil
    private
    # Creates a status from the current entry and queues follow-up work.
    #
    # - Does nothing when redis holds a `delete_upon_arrival:<id>` key for this
    #   entry (delete_status writes that key for statuses it could not find).
    # - Inside a transaction, builds the status via status_from_xml; returns
    #   nil when none was produced and returns the existing status untouched
    #   when it was not just created.
    # - For :share entries, resolves the shared status from the embedded
    #   activity:object; destroys the new status and returns nil when it cannot
    #   be resolved. When the shared status is itself a reblog, the new status
    #   points at that reblog target instead.
    # - Afterwards notifies mentioned accounts (non-reblogs) or the local author
    #   of the reblogged status, queues LinkCrawlWorker unless spoiler text is
    #   present, queues DistributionWorker and returns the status.
    #
    # NOTE(review): several `end` lines of this method (transaction block,
    # method body) are not visible in this view.
    def create_status
      if redis.exists("delete_upon_arrival:#{id}")
        Rails.logger.debug "Delete for status #{id} was queued, ignoring"
        return
      end

      Rails.logger.debug "Creating remote status #{id}"
Eugen Rochko's avatar
Eugen Rochko committed

      ApplicationRecord.transaction do
        status, just_created = status_from_xml(@xml)

        return if status.nil?
        return status unless just_created
        if verb == :share
          original_status = shared_status_from_xml(@xml.at_xpath('.//activity:object', activity: TagManager::AS_XMLNS))
          status.reblog   = original_status
Eugen Rochko's avatar
Eugen Rochko committed

          if original_status.nil?
            status.destroy
            return nil
          elsif original_status.reblog?
            status.reblog = original_status.reblog
          end
Eugen Rochko's avatar
Eugen Rochko committed
        end
      notify_about_mentions!(status) unless status.reblog?
      notify_about_reblog!(status) if status.reblog? && status.reblog.account.local?
      Rails.logger.debug "Queuing remote status #{status.id} (#{id}) for distribution"

      LinkCrawlWorker.perform_async(status.id) unless status.spoiler_text.present?
      DistributionWorker.perform_async(status.id)
      status
    # Sends a mention notification to every mentioned account that is local;
    # mentions of non-local accounts are passed over.
    def notify_about_mentions!(status)
      status.mentions.includes(:account).each do |mention|
        recipient = mention.account
        NotifyService.new.call(recipient, mention) if recipient.local?
      end
    end

    # Notifies the account that owns the reblogged status, handing over
    # +status+ (the reblog itself) as the activity.
    def notify_about_reblog!(status)
      notifier = NotifyService.new
      notifier.call(status.reblog.account, status)
    end

    # Deletes the status whose uri equals this entry's id.
    # When no such status exists yet, a `delete_upon_arrival:<id>` key is
    # stored in redis with a TTL of 6 * 3_600 seconds (six hours) so that
    # create_status ignores the status if it shows up later.
    # NOTE(review): the `end` closing this method is not visible in this view.
    def delete_status
      Rails.logger.debug "Deleting remote status #{id}"
      status = Status.find_by(uri: id)

      if status.nil?
        redis.setex("delete_upon_arrival:#{id}", 6 * 3_600, id)
      else
        RemoveStatusService.new.call(status)
      end

    # True unless the entry's verb is post/share/delete AND its object type is
    # activity/note/comment. The type is only consulted for a supported verb.
    def skip_unsupported_type?
      return true unless %i(post share delete).include?(verb)

      !%i(activity note comment).include?(type)
    end
    # Resolves the status referenced by a share entry: a status already known
    # under the entry's id wins, otherwise FetchRemoteStatusService is asked to
    # fetch it from the entry's url.
    def shared_status_from_xml(entry)
      known = find_status(id(entry))
      known.nil? ? FetchRemoteStatusService.new.call(url(entry)) : known
    end

    # Builds a status record from +entry+. The caller destructures the result
    # as `[status, just_created]`, and a suspended author yields `[nil, false]`.
    #
    # Visible steps: look up an existing status by the entry id, resolve the
    # embedded author when the entry carries one, assemble the status
    # attributes (uri, url, account, text, language, visibility, conversation),
    # attach the thread parent for replies, then process mentions, hashtags and
    # media.
    #
    # NOTE(review): this view is missing parts of the method: the early return
    # announced by the first comment, the rescue/end of the `begin` block, the
    # call that receives the attribute list, the final return value and the
    # closing `end`.
    def status_from_xml(entry)
      # Return early if status already exists in db
      status = find_status(id(entry))
      # If status embeds an author, find that author
      # If that author cannot be found, don't record the status (do not misattribute)
      if account?(entry)
        begin
          account = author_from_xml(entry)
      return [nil, false] if account.suspended?
        uri: id(entry),
        url: url(entry),
Eugen Rochko's avatar
Eugen Rochko committed
        account: account,
        text: content(entry),
Eugen's avatar
Eugen committed
        language: content_language(entry),
        visibility: visibility_scope(entry),
        conversation: find_or_create_conversation(entry)

      if thread?(entry)
Eugen Rochko's avatar
Eugen Rochko committed
        Rails.logger.debug "Trying to attach #{status.id} (#{id(entry)}) to #{thread(entry).first}"
        status.thread = find_or_resolve_status(status, *thread(entry))
      end
      mentions_from_xml(status, entry)
      hashtags_from_xml(status, entry)
      media_from_xml(status, entry)
Eugen Rochko's avatar
Eugen Rochko committed

    # Returns the status known under +uri+, or nil. In the nil case a
    # ThreadResolveWorker job is queued with the parent id and +url+.
    def find_or_resolve_status(parent, uri, url)
      find_status(uri).tap do |found|
        ThreadResolveWorker.perform_async(parent.id, url) if found.nil?
      end
    end
    # Looks up the Conversation referenced by the entry's ostatus:conversation
    # `ref` attribute. Returns nil when the element or attribute is absent.
    # Local refs are translated to a local id and matched on `id`; any other
    # ref is matched on `uri`. Nothing is created in this method itself.
    def find_or_create_conversation(xml)
      conversation_node = xml.at_xpath('./ostatus:conversation', ostatus: TagManager::OS_XMLNS)
      uri = conversation_node&.attribute('ref')&.content
      return if uri.nil?

      tag_manager = TagManager.instance
      return Conversation.find_by(uri: uri) unless tag_manager.local_id?(uri)

      Conversation.find_by(id: tag_manager.unique_tag_to_local_id(uri, 'Conversation'))
    end

    # Looks up a Status for +uri+. URIs that TagManager reports as local are
    # translated to a local id and matched on `id`; every other URI is matched
    # on the `uri` attribute. Returns whatever Status.find_by returns.
    # NOTE(review): the `end` lines closing the `if` and the method are not
    # visible in this view.
    def find_status(uri)
      if TagManager.instance.local_id?(uri)
        local_id = TagManager.instance.unique_tag_to_local_id(uri, 'Status')
        return Status.find_by(id: local_id)

      Status.find_by(uri: uri)
    # Records mentions for +parent+ from the entry's `link rel="mentioned"`
    # elements. Links whose ostatus:object-type is the group or collection
    # type are skipped, as are hrefs that resolve to no account and accounts
    # already handled earlier in the same entry. For each remaining account a
    # mention of +parent+ is found or created.
    # NOTE(review): the `end` closing this method is not visible in this view.
    def mentions_from_xml(parent, xml)
      processed_account_ids = []
      xml.xpath('./xmlns:link[@rel="mentioned"]', xmlns: TagManager::XMLNS).each do |link|
        next if [TagManager::TYPES[:group], TagManager::TYPES[:collection]].include? link['ostatus:object-type']
        mentioned_account = account_from_href(link['href'])
Eugen Rochko's avatar
Eugen Rochko committed

        next if mentioned_account.nil? || processed_account_ids.include?(mentioned_account.id)
        mentioned_account.mentions.where(status: parent).first_or_create(status: parent)
        # So we can skip duplicate mentions
        processed_account_ids << mentioned_account.id
      end
      url = Addressable::URI.parse(href).normalize

      if TagManager.instance.web_domain?(url.host)
        Account.find_local(url.path.gsub('/users/', ''))
      else
        Account.where(uri: href).or(Account.where(url: href)).first || FetchRemoteAccountService.new.call(href)
    # Collects the non-blank `term` attribute of each `category` element of the
    # entry and passes the list to ProcessHashtagsService together with
    # +parent+.
    # NOTE(review): the `end` closing this method is not visible in this view.
    def hashtags_from_xml(parent, xml)
      tags = xml.xpath('./xmlns:category', xmlns: TagManager::XMLNS).map { |category| category['term'] }.select(&:present?)
      ProcessHashtagsService.new.call(parent, tags)
Eugen Rochko's avatar
Eugen Rochko committed

    # Attaches media to +parent+ from the entry's `link rel="enclosure"`
    # elements. Per link with an href: finds or initializes a MediaAttachment
    # keyed by status and remote url, skips the link unless the normalized URL
    # uses http or https and has a non-empty host, and saves the record. The
    # remote file is then assigned (file_remote_url) and saved, unless a
    # DomainBlock for the author's domain reports reject_media?.
    # NOTE(review): `parsed_url.host.empty?` would raise if host can be nil for
    # an http(s) URL - confirm against Addressable behaviour.
    # NOTE(review): the body of the rescue clause and the closing `end` lines
    # are not visible in this view.
    def media_from_xml(parent, xml)
      do_not_download = DomainBlock.find_by(domain: parent.account.domain)&.reject_media?
      xml.xpath('./xmlns:link[@rel="enclosure"]', xmlns: TagManager::XMLNS).each do |link|
        next unless link['href']
        media = MediaAttachment.where(status: parent, remote_url: link['href']).first_or_initialize(account: parent.account, status: parent, remote_url: link['href'])
        parsed_url = Addressable::URI.parse(link['href']).normalize
        next if !%w(http https).include?(parsed_url.scheme) || parsed_url.host.empty?

        media.save

        next if do_not_download
Eugen Rochko's avatar
Eugen Rochko committed

        begin
          media.file_remote_url = link['href']
          media.save!
        rescue ActiveRecord::RecordInvalid
Eugen Rochko's avatar
Eugen Rochko committed
    end
    # Text content of the entry's `id` element; works on @xml unless another
    # node is passed. Raises if the element is absent (nil has no `content`).
    def id(xml = @xml)
      xml.at_xpath('./xmlns:id', xmlns: TagManager::XMLNS).content
    # Maps the text of the entry's activity:verb element to its key in
    # TagManager::VERBS. Any StandardError raised on the way (for instance when
    # the element is absent) results in :post.
    # NOTE(review): presumably VERBS is a Hash, in which case an unrecognized
    # verb text yields nil rather than :post - confirm.
    def verb(xml = @xml)
      raw = xml.at_xpath('./activity:verb', activity: TagManager::AS_XMLNS).content
      TagManager::VERBS.key(raw)
    rescue
      :post
    # Object type of the entry: the key under which the text of its
    # activity:object-type element is registered in TagManager::TYPES.
    # Falls back to :activity whenever the lookup raises, e.g. because the
    # element is absent.
    def type(xml = @xml)
      type_node = xml.at_xpath('./activity:object-type', activity: TagManager::AS_XMLNS)
      TagManager::TYPES.key(type_node.content)
    rescue StandardError
      :activity
    end
    # Locates the entry's `link rel="alternate"` element.
    # NOTE(review): the remainder of this method (what is derived from `link`
    # and returned) is not visible in this view.
    def url(xml = @xml)
      link = xml.at_xpath('./xmlns:link[@rel="alternate"]', xmlns: TagManager::XMLNS)
    # Text content of the entry's `content` element; works on @xml unless
    # another node is passed. Raises if the element is absent.
    def content(xml = @xml)
      xml.at_xpath('./xmlns:content', xmlns: TagManager::XMLNS).content
Eugen's avatar
Eugen committed
    # Language declared through the `xml:lang` attribute of the entry's
    # `content` element; 'en' when the attribute is missing or blank.
    def content_language(xml = @xml)
      content_node = xml.at_xpath('./xmlns:content', xmlns: TagManager::XMLNS)
      declared = content_node['xml:lang']
      declared&.presence || 'en'
    end

      xml.at_xpath('./xmlns:summary', xmlns: TagManager::XMLNS)&.content || ''
    # Visibility taken from the entry's mastodon:scope element, as a symbol.
    # :public when the element (or its content) is missing.
    def visibility_scope(xml = @xml)
      scope_node = xml.at_xpath('./mastodon:scope', mastodon: TagManager::MTDN_XMLNS)
      scope_text = scope_node&.content
      scope_text.nil? ? :public : scope_text.to_sym
    end

    # Text content of the entry's `published` element; works on @xml unless
    # another node is passed. Raises if the element is absent.
    def published(xml = @xml)
      xml.at_xpath('./xmlns:published', xmlns: TagManager::XMLNS).content
    # Whether the entry carries a thr:in-reply-to element, i.e. is a reply.
    def thread?(xml = @xml)
      !xml.at_xpath('./thr:in-reply-to', thr: TagManager::THR_XMLNS).nil?
    # The `ref` and `href` attributes (in that order) of the entry's
    # thr:in-reply-to element. Raises when the element is absent, so callers
    # are expected to check thread? first.
    def thread(xml = @xml)
      reply_to = xml.at_xpath('./thr:in-reply-to', thr: TagManager::THR_XMLNS)
      %w(ref href).map { |attr_name| reply_to[attr_name] }
    end
    # Whether the entry embeds an `author` element.
    def account?(xml = @xml)
      !xml.at_xpath('./xmlns:author', xmlns: TagManager::XMLNS).nil?
Eugen Rochko's avatar
Eugen Rochko committed
end