HEX
Server: Apache/2.4.41 (Ubuntu)
System: Linux vmi1674223.contaboserver.net 5.4.0-182-generic #202-Ubuntu SMP Fri Apr 26 12:29:36 UTC 2024 x86_64
User: root (0)
PHP: 7.4.3-4ubuntu2.22
Disabled: pcntl_alarm,pcntl_fork,pcntl_waitpid,pcntl_wait,pcntl_wifexited,pcntl_wifstopped,pcntl_wifsignaled,pcntl_wifcontinued,pcntl_wexitstatus,pcntl_wtermsig,pcntl_wstopsig,pcntl_signal,pcntl_signal_get_handler,pcntl_signal_dispatch,pcntl_get_last_error,pcntl_strerror,pcntl_sigprocmask,pcntl_sigwaitinfo,pcntl_sigtimedwait,pcntl_exec,pcntl_getpriority,pcntl_setpriority,pcntl_async_signals,pcntl_unshare,
Upload Files
File: //opt/openproject/app/workers/extract_fulltext_job.rb
#-- encoding: UTF-8

#-- copyright
# OpenProject is an open source project management software.
# Copyright (C) 2012-2020 the OpenProject GmbH
#
# This program is free software; you can redistribute it and/or
# modify it under the terms of the GNU General Public License version 3.
#
# OpenProject is a fork of ChiliProject, which is a fork of Redmine. The copyright follows:
# Copyright (C) 2006-2017 Jean-Philippe Lang
# Copyright (C) 2010-2013 the ChiliProject Team
#
# This program is free software; you can redistribute it and/or
# modify it under the terms of the GNU General Public License
# as published by the Free Software Foundation; either version 2
# of the License, or (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program; if not, write to the Free Software
# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301, USA.
#
# See docs/COPYRIGHT.rdoc for more details.
#++

# Background job that extracts the plaintext of an attachment's file and
# stores it, together with the text search vectors built from the text and
# from the file name, on the attachment's database row.
#
# Extraction, persistence and cleanup are all best effort: failures are
# logged and swallowed rather than raised.
class ExtractFulltextJob < ApplicationJob
  queue_with_priority :low

  # Extracts and persists the fulltext for one attachment.
  #
  # Does nothing when the database does not allow TSV columns or when no
  # attachment with the given id exists.
  #
  # @param attachment_id id of the Attachment to index
  def perform(attachment_id)
    @attachment_id = attachment_id
    @attachment = nil
    @text = nil
    @file = nil
    @filename = nil
    @language = OpenProject::Configuration.main_content_language

    return unless OpenProject::Database.allows_tsv?

    @attachment = find_attachment(attachment_id)
    return unless @attachment

    init
    update
  ensure
    # Runs on every exit path, including the early returns above; in those
    # cases @file is still nil and nothing is removed.
    remove_local_copy if delete_file?
  end

  private

  # Fetches the local file and its name from the attachment's uploader and,
  # if the attachment is readable, resolves its plaintext.
  #
  # Any StandardError is logged and swallowed; whatever was not assigned
  # before the failure (@file, @filename, @text) stays nil.
  def init
    carrierwave_uploader = @attachment.file
    @file = carrierwave_uploader.local_file
    @filename = carrierwave_uploader.file.filename

    if @attachment.readable?
      resolver = Plaintext::Resolver.new(@file, @attachment.content_type)
      @text = resolver.text
    end
  rescue StandardError => e
    # Log the exception class next to the message: `e` and `e.message`
    # interpolate to the same text, so printing both only duplicated it.
    Rails.logger.error(
      "Failed to extract plaintext from file #{@attachment&.id} (On domain #{Setting.host_name}): #{e.class}: #{e.message}"
    )
  end

  # Writes the extracted text and both search vectors in a single UPDATE.
  #
  # Called even when extraction failed, in which case @text is nil.
  # Any StandardError is logged (message cut to 500 characters) and swallowed.
  def update
    # Bind order: fulltext, then (language, text) for fulltext_tsv,
    # then (language, file name) for file_tsv.
    Attachment
      .where(id: @attachment_id)
      .update_all(['fulltext = ?, fulltext_tsv = to_tsvector(?, ?), file_tsv = to_tsvector(?, ?)',
                   @text,
                   @language,
                   OpenProject::FullTextSearch.normalize_text(@text),
                   @language,
                   OpenProject::FullTextSearch.normalize_filename(@filename)])
  rescue StandardError => e
    Rails.logger.error(
      "Failed to update TSV values for attachment #{@attachment&.id} (On domain #{Setting.host_name}): #{e.message[0..499]}[...]"
    )
  end

  # @param id id of the attachment to look up
  # @return [Attachment, nil] the attachment, or nil when none has that id
  def find_attachment(id)
    Attachment.find_by_id id
  end

  # @return [Boolean] true unless the attachment's uploader is a
  #   LocalFileUploader; also true when there is no attachment, because
  #   nil is not a LocalFileUploader
  def remote_file?
    uploader = @attachment&.file
    !uploader.is_a?(LocalFileUploader)
  end

  # @return a truthy value only when a local copy was obtained from a
  #   non-local uploader, i.e. when there is a file this job should remove
  def delete_file?
    remote_file? && @file
  end

  # Removes the local copy referenced by @file.
  #
  # A StandardError is logged and swallowed, like in #init and #update, so
  # that a failed removal neither fails a job whose update already went
  # through nor replaces an exception that is already propagating.
  def remove_local_copy
    FileUtils.rm @file.path
  rescue StandardError => e
    Rails.logger.error(
      "Failed to remove local copy of attachment #{@attachment&.id} (On domain #{Setting.host_name}): #{e.class}: #{e.message}"
    )
  end
end