scinote-web/app/models/asset.rb

452 lines
13 KiB
Ruby
Raw Normal View History

# frozen_string_literal: true
2017-06-23 21:19:08 +08:00
class Asset < ApplicationRecord
2016-02-12 23:52:43 +08:00
# Behaviour mixed into the model
include SearchableModel
include DatabaseHelper
include Encryptor
include WopiUtil
include ActiveStorageFileUtil
include ActiveStorageConcerns

require 'tempfile'

# Lock duration set to 30 minutes (in seconds, it is added to a Unix
# timestamp when a lock is taken or refreshed)
LOCK_DURATION = 60 * 30

# ActiveStorage configuration
has_one_attached :file

# Asset validation
# This could cause some problems if you create empty asset and want to
# assign it to result
validate :step_or_result_or_repository_asset_value
validate :wopi_filename_valid,
         on: :wopi_file_creation

belongs_to :created_by,
           foreign_key: 'created_by_id',
           class_name: 'User',
           optional: true
belongs_to :last_modified_by,
           foreign_key: 'last_modified_by_id',
           class_name: 'User',
           optional: true
belongs_to :team, optional: true

# An asset hangs off a step, a result or a repository cell through the
# corresponding join record
has_one :step_asset, inverse_of: :asset, dependent: :destroy
has_one :step, through: :step_asset, dependent: :nullify
has_one :result_asset, inverse_of: :asset, dependent: :destroy
has_one :result, through: :result_asset, dependent: :nullify
has_one :repository_asset_value, inverse_of: :asset, dependent: :destroy
has_one :repository_cell, through: :repository_asset_value,
                          dependent: :nullify
has_many :report_elements, inverse_of: :asset, dependent: :destroy
has_one :asset_text_datum, inverse_of: :asset, dependent: :destroy

# Touch the owning result and step (when present) after every save
after_save { result&.touch; step&.touch }

# Non-persisted attributes; in_template is read by update_estimated_size
# to skip the size calculation
attr_accessor :file_content, :file_info, :in_template
2016-02-12 23:52:43 +08:00
# Searches assets by attached file name and by extracted text.
#
# Candidate assets are those attached to steps/results returned by
# Step.search / Result.search for +user+, plus assets stored in
# repositories that belong to one of the user's teams. The candidates are
# then filtered on the blob filename and on the text vector of the
# associated asset_text_datum.
#
# @param user the user whose teams, steps and results scope the search
# @param include_archived forwarded unchanged to Step.search/Result.search
# @param query [String] search text. NOTE(review): the default is nil, but
#   the body calls String methods on it unconditionally, so callers have to
#   pass a String.
# @param page [Integer] 1-based page number, or Constants::SEARCH_NO_LIMIT
#   to get the unpaginated relation
# @param _current_team unused
# @param options [Hash] :whole_word, :whole_phrase and :match_case; each is
#   enabled when its value stringifies to 'true'
# @return [ActiveRecord::Relation] the matching assets; when paginated each
#   row also carries +data+ and a +headline+ column with <mark> highlights
def self.search(
  user,
  include_archived,
  query = nil,
  page = 1,
  _current_team = nil,
  options = {}
)
  teams = user.teams.select(:id)

  assets_in_steps = Asset.joins(:step).where(
    'steps.id IN (?)',
    Step.search(user, include_archived, nil, Constants::SEARCH_NO_LIMIT)
        .select(:id)
  ).pluck(:id)

  assets_in_results = Asset.joins(:result).where(
    'results.id IN (?)',
    Result.search(user, include_archived, nil, Constants::SEARCH_NO_LIMIT)
          .select(:id)
  ).pluck(:id)

  assets_in_inventories = Asset.joins(
    repository_cell: { repository_column: :repository }
  ).where('repositories.team_id IN (?)', teams).pluck(:id)

  assets =
    Asset.distinct
         .where('assets.id IN (?) OR assets.id IN (?) OR assets.id IN (?)',
                assets_in_steps, assets_in_results, assets_in_inventories)

  new_query = Asset.left_outer_joins(:asset_text_datum)
                   .joins(file_attachment: :blob)
                   .from(assets, 'assets')

  if options[:whole_word].to_s == 'true' ||
     options[:whole_phrase].to_s == 'true'
    # Regular expression match on the filename, case sensitive on demand
    like = options[:match_case].to_s == 'true' ? '~' : '~*'
    s_query = query.gsub(/[!()&|:]/, ' ')
                   .strip
                   .split(/\s+/)
                   .map { |t| t + ':*' }

    if options[:whole_word].to_s == 'true'
      # Any of the words may match
      a_query = query.split
                     .map { |a| Regexp.escape(a) }
                     .join('|')
      s_query = s_query.join('|')
    else
      # The phrase has to match as a whole
      a_query = Regexp.escape(query)
      s_query = s_query.join('&')
    end
    # \y is wrapped around the pattern so it only matches on word boundaries
    a_query = '\\y(' + a_query + ')\\y'
    s_query = s_query.tr('\'', '"')

    new_query = new_query.where(
      "(active_storage_blobs.filename #{like} ? " \
      "OR asset_text_data.data_vector @@ to_tsquery(?))",
      a_query,
      s_query
    )
  else
    like = options[:match_case].to_s == 'true' ? 'LIKE' : 'ILIKE'
    a_query = query.split.map { |a| "%#{sanitize_sql_like(a)}%" }

    # Trim whitespace and replace it with OR character. Make prefixed
    # wildcard search term and escape special characters.
    # For example, search term 'demo project' is transformed to
    # 'demo:*|project:*' which makes word inclusive search with postfix
    # wildcard.
    s_query = query.gsub(/[!()&|:]/, ' ')
                   .strip
                   .split(/\s+/)
                   .map { |t| t + ':*' }
                   .join('|')
                   .tr('\'', '"')

    new_query = new_query.where(
      "(active_storage_blobs.filename #{like} ANY (array[?]) " \
      "OR asset_text_data.data_vector @@ to_tsquery(?))",
      a_query,
      s_query
    )
  end

  # Show all results if needed
  return new_query if page == Constants::SEARCH_NO_LIMIT

  new_query = new_query.select('assets.*, asset_text_data.data AS data')
                       .limit(Constants::SEARCH_LIMIT)
                       .offset((page - 1) * Constants::SEARCH_LIMIT)

  # Bind the tsquery text as a parameter: sanitize_sql_for_conditions leaves
  # a plain String untouched, so it only quotes when given the array form.
  headline_select = sanitize_sql_for_conditions(
    [
      'assets_search.*, ts_headline(assets_search.data, to_tsquery(?), ' \
      "'StartSel=<mark>, StopSel=</mark>') AS headline",
      s_query
    ]
  )
  Asset.select(headline_select).from(new_query, 'assets_search')
end
# Returns the blob of the attached file, or nil when +file+ itself is nil.
def blob
  attachment = file
  attachment.nil? ? nil : attachment.blob
end
2019-06-28 14:17:09 +08:00
# Tells whether a preview can be produced for the attached file.
#
# @return false when no file is attached; otherwise the result of
#   previewable_document?(blob) || previewable_image?
def previewable?
  return false unless file.attached?

  previewable_document?(blob) || previewable_image?
end
2019-06-24 21:17:42 +08:00
# Requests a representation of the attached file resized to fit within
# Constants::MEDIUM_PIC_FORMAT.
#
# @return whatever file.representation returns for that resize option
def medium_preview
  file.representation(resize_to_limit: Constants::MEDIUM_PIC_FORMAT)
end
# Requests a representation of the attached file resized to fit within
# Constants::LARGE_PIC_FORMAT.
#
# @return whatever file.representation returns for that resize option
def large_preview
  file.representation(resize_to_limit: Constants::LARGE_PIC_FORMAT)
end
# Sanitized name of the attached file.
#
# @return [String, nil] '' when no file is attached; otherwise the blob's
#   sanitized filename (nil if the blob or its filename is missing)
def file_name
  return '' unless file.attached?

  file.blob&.filename&.sanitized
end
# Size of the attached file in bytes.
#
# @return [Integer, nil] 0 when no file is attached; otherwise the blob's
#   byte_size (nil if the blob is missing)
def file_size
  return 0 unless file.attached?

  file.blob&.byte_size
end
# MIME type of the attached file.
#
# Gives '' when nothing is attached, otherwise the content type recorded
# on the blob (nil when the blob is missing).
def content_type
  attachment = file
  if attachment.attached?
    attachment.blob&.content_type
  else
    ''
  end
end
# Creates a saved copy of this asset and copies the attached file over.
#
# Gives back the copy, or nil when the copy could not be saved (in which
# case no file is duplicated).
def duplicate
  copy = dup
  if copy.save
    duplicate_file(copy)
    copy
  end
end
# Copies the attached file of this asset onto +to_asset+ and then runs
# post-processing on the destination.
#
# @param to_asset the destination asset; has to be persisted already
# @return nil when this asset has no file attached; otherwise the result
#   of to_asset.post_process_file
# @raise [ArgumentError] when +to_asset+ is not persisted
def duplicate_file(to_asset)
  return unless file.attached?
  raise ArgumentError, 'Destination asset should be persisted first!' unless to_asset.persisted?

  # The source blob is opened as a temporary file and uploaded as a new
  # blob carrying the same filename and metadata
  file.blob.open do |tmp_file|
    to_blob = ActiveStorage::Blob.create_after_upload!(
      io: tmp_file,
      filename: blob.filename,
      metadata: blob.metadata
    )
    to_asset.file.attach(to_blob)
  end
  to_asset.post_process_file(to_asset.team)
end
2019-06-28 14:17:09 +08:00
# Tells whether the content type is one of the whitelisted image types.
#
# The pattern is anchored with \A so it has to match at the very start of
# the content type (^ would also match after any newline in the value).
#
# @return [Integer, nil] match position (0) on a match, nil otherwise
def image?
  content_type =~ %r{\Aimage/#{Regexp.union(Constants::WHITELISTED_IMAGE_TYPES)}}
end
2016-07-21 19:11:15 +08:00
# Tells whether the attached file's content type starts with one of the
# prefixes in Constants::TEXT_EXTRACT_FILE_TYPES. A missing file, blob or
# content type counts as "not text".
def text?
  mime_type = file&.blob&.content_type
  return false if mime_type.nil?

  Constants::TEXT_EXTRACT_FILE_TYPES.any? { |prefix| mime_type.start_with?(prefix) }
end
# Tells whether the attached file is flagged as a MarvinJS asset, i.e. its
# metadata carries asset_type 'marvinjs'.
#
# @return [Boolean] false when no file is attached (the metadata lookup is
#   skipped in that case, in line with the other file accessors)
def marvinjs?
  return false unless file.attached?

  file.metadata[:asset_type] == 'marvinjs'
end
2017-01-24 23:34:21 +08:00
# Runs the follow-up work needed once a file has been attached.
#
# Marks the file as present, then either schedules text extraction (text
# files), extracts text right away (MarvinJS assets) or just recalculates
# the estimated size.
#
# @param team optional team handed to update_estimated_size; only used on
#   the branch that updates the size immediately
def post_process_file(team = nil)
  # Flag the asset as having its file in place
  update(file_present: true)

  # Extract asset text if it's of correct type
  if text?
    Rails.logger.info "Asset #{id}: Creating extract text job"
    # The extract_asset_text also includes
    # estimated size calculation
    Asset.delay(queue: :assets, run_at: 20.minutes.from_now)
         .extract_asset_text_delayed(id, in_template)
  elsif marvinjs?
    extract_asset_text
  else
    # Update asset's estimated size immediately
    update_estimated_size(team)
  end
end
# Entry point for the delayed text extraction: looks the asset up by id
# and extracts its text.
#
# @param asset_id id of the asset to process
# @param in_template forwarded to Asset#extract_asset_text
# @return nil when the asset no longer exists or has no file attached;
#   otherwise the result of extract_asset_text
def self.extract_asset_text_delayed(asset_id, in_template = false)
  asset = find_by(id: asset_id)
  return if asset.nil? || !asset.file.attached?

  asset.extract_asset_text(in_template)
end
2016-02-12 23:52:43 +08:00
# Extracts searchable text from the attached file and stores it in the
# asset's text datum, then recalculates the estimated size.
#
# MarvinJS assets take their text from the 'text' fields of the XML kept
# in the file metadata description; every other file is opened as a
# temporary file and handed to Yomu.
#
# Any StandardError raised along the way is logged and swallowed.
#
# @param in_template stored on the asset before extracting; read later by
#   update_estimated_size
def extract_asset_text(in_template = false)
  self.in_template = in_template
  # Declared up front because one branch assigns it from inside a block
  text_data = nil

  if marvinjs?
    mjs_doc = Nokogiri::XML(file.metadata[:description])
    mjs_doc.remove_namespaces!
    text_data = mjs_doc.search("//Field[@name='text']").map(&:text).join(' ')
  else
    # Start Tika as a server
    Yomu.server(:text) if !ENV['NO_TIKA_SERVER'] && Yomu.class_variable_get(:@@server_pid).nil?
    blob.open do |tmp_file|
      text_data = Yomu.new(tmp_file.path).text
    end
  end

  if asset_text_datum.present?
    # Update existing text datum if it exists
    asset_text_datum.update(data: text_data)
  else
    # Create new text datum
    AssetTextDatum.create(data: text_data, asset: self)
  end

  Rails.logger.info "Asset #{id}: Asset file successfully extracted"

  # Finally, update asset's estimated size to include
  # the data vector
  update_estimated_size(team)
rescue StandardError => e
  # Safe navigation keeps the handler itself from raising when the blob
  # is missing
  Rails.logger.fatal(
    "Asset #{id}: Error extracting contents from asset " \
    "file #{blob&.key}: #{e.message}"
  )
end
2017-01-24 23:34:21 +08:00
# Recalculates and stores the asset's estimated size: the file size plus,
# when a persisted text datum exists, the octet length of its data and
# data_vector, multiplied by Constants::ASSET_ESTIMATED_SIZE_FACTOR.
#
# If team is provided, its space_taken
# is updated as well
#
# Nothing happens when the file size is blank or the asset is flagged as
# in_template.
#
# @param team optional team that gets take_space(estimated size) and save
def update_estimated_size(team = nil)
  return if file_size.blank? || in_template

  es = file_size
  if asset_text_datum.present? && asset_text_datum.persisted?
    # Reload before the octet lengths of its columns are measured
    asset_text_datum.reload
    es += get_octet_length_record(asset_text_datum, :data)
    es += get_octet_length_record(asset_text_datum, :data_vector)
  end
  es *= Constants::ASSET_ESTIMATED_SIZE_FACTOR
  update(estimated_size: es)
  Rails.logger.info "Asset #{id}: Estimated size successfully calculated"

  # Finally, update team's space
  return unless team.present?

  team.take_space(es)
  team.save
end
# Tells whether the given WOPI action is available for this asset's file.
#
# Always false unless WOPI_ENABLED is 'true'. Files with the 'wopitest'
# extension are rejected unless WOPI_TEST_ENABLED is set to something
# other than 'false'. Otherwise the answer is whether get_action finds an
# action for the file extension.
def can_perform_action(action)
  return false unless ENV['WOPI_ENABLED'] == 'true'

  extension = file_name.split('.').last
  test_switch = ENV['WOPI_TEST_ENABLED']
  return false if extension == 'wopitest' && (test_switch.nil? || test_switch == 'false')

  !get_action(extension, action).nil?
end
# Builds the URL for a WOPI action on this asset.
#
# The action's urlsrc template has its IsLicensedUser placeholder filled
# in (1 when WOPI_BUSINESS_USERS is 'true', 0 otherwise), every remaining
# <name=value> placeholder removed, and WOPISrc pointing at this asset's
# WOPI REST endpoint appended.
#
# @param user the user whose WOPI token is appended when +with_tokens+
# @param action name of the action, looked up through get_action for the
#   file's extension
# @param with_tokens [Boolean] append access_token and access_token_ttl
# @return [String, nil] the URL, or nil when no such action is found
def get_action_url(user, action, with_tokens = true)
  file_ext = file_name.split('.').last
  action = get_action(file_ext, action)
  return nil if action.nil?

  licensed = ENV['WOPI_BUSINESS_USERS'] == 'true' ? '1' : '0'
  # The placeholder comes with or without a trailing '&'; the capture
  # carries it over into the replacement
  action_url = action.urlsrc.gsub(
    /<IsLicensedUser=BUSINESS_USER(&?)>/,
    "IsLicensedUser=#{licensed}\\1"
  )
  # Drop all placeholders that were not filled in
  action_url = action_url.gsub(/<.*?=.*?>/, '')

  rest_url = Rails.application.routes.url_helpers.wopi_rest_endpoint_url(
    host: ENV['WOPI_ENDPOINT_URL'],
    id: id
  )
  action_url += "WOPISrc=#{rest_url}"
  return action_url unless with_tokens

  token = user.get_wopi_token
  # The token's ttl is multiplied by 1000 for the access_token_ttl parameter
  "#{action_url}&access_token=#{token.token}" \
    "&access_token_ttl=#{token.ttl * 1000}"
end
2016-09-29 18:19:29 +08:00
# Icon of the WOPI app that provides the given action for this asset's
# file extension.
#
# @param action name of the action, looked up through get_action
# @return the app's icon, or nil when there is no matching action or the
#   action has no wopi_app
def favicon_url(action)
  file_ext = file_name.split('.').last
  get_action(file_ext, action)&.wopi_app&.icon
end
# locked?, lock_asset and refresh_lock rely on the asset
# being locked in the database to prevent race conditions
# Tells whether the asset currently holds a lock. Expired locks are
# cleared first, so only a lock that is still set afterwards counts.
def locked?
  unlock_expired
  current_lock = lock
  !current_lock.nil?
end
# Locks the asset with the given lock string for LOCK_DURATION seconds
# from now and saves it, raising if the save fails.
def lock_asset(lock_string)
  expires_at = Time.now.to_i + LOCK_DURATION
  self.lock = lock_string
  self.lock_ttl = expires_at
  save!
end
# Pushes the lock expiry to LOCK_DURATION seconds from now and saves the
# asset, raising if the save fails. The lock string itself is untouched.
def refresh_lock
  now = Time.now.to_i
  self.lock_ttl = now + LOCK_DURATION
  save!
end
# Releases the lock: clears both the lock string and its expiry, then
# saves the asset, raising if the save fails.
def unlock
  self.lock_ttl = nil
  self.lock = nil
  save!
end
# Clears the lock when its expiry lies in the past. The check and the
# update both run inside with_lock; nothing is saved when there is no
# expiry or it has not been reached yet.
def unlock_expired
  with_lock do
    next if lock_ttl.nil? || lock_ttl >= Time.now.to_i

    self.lock = nil
    self.lock_ttl = nil
    save!
  end
end
# Replaces the attached file's contents, keeping the current file name,
# and bumps the version counter.
#
# @param new_file IO object with the new contents
# @return the result of +save+
def update_contents(new_file)
  file.attach(io: new_file, filename: file_name)
  # A missing version counts as 0, so the first update yields version 1
  self.version = (version || 0) + 1
  save
end
# Tells whether the attached file is an image of an editable type and the
# asset is not locked.
#
# The pattern is anchored with \A so it has to match at the very start of
# the content type (^ would also match after any newline in the value).
#
# @return false when the asset is locked; otherwise the match position (0)
#   on a match or nil
def editable_image?
  !locked? && %r{\Aimage/#{Regexp.union(Constants::WHITELISTED_IMAGE_TYPES_EDITABLE)}} =~ file.content_type
end
# Base64 rendition of a preview of the attached file.
#
# @param style [Symbol] only :medium is handled
# @return the result of convert_variant_to_base64 for the medium preview,
#   or nil for any other style
def generate_base64(style)
  convert_variant_to_base64(medium_preview) if style == :medium
end
private
# Path of the 'tmp' directory under the application root.
def tempdir
  app_root = Rails.root
  app_root.join('tmp')
end
2019-06-28 14:17:09 +08:00
# Tells whether the attached blob's content type is one of the whitelisted
# image types.
#
# The pattern is anchored with \A so it has to match at the very start of
# the content type (^ would also match after any newline in the value).
#
# @return [Integer, nil] match position (0) on a match, nil otherwise
#   (including a missing blob or content type)
def previewable_image?
  file.blob&.content_type =~ %r{\Aimage/#{Regexp.union(Constants::WHITELISTED_IMAGE_TYPES)}}
end
# Validation: an asset may belong to at most one of step, result and
# repository asset value.
#
# We must allow all of them to be blank because of GUI
# (even though it's not really a "valid" asset)
def step_or_result_or_repository_asset_value
  owners = [step, result, repository_asset_value]
  return unless owners.count(&:present?) > 1

  errors.add(
    :base,
    'Asset can only be result or step or repository cell, not ever.'
  )
end
# Validation run on :wopi_file_creation: the file name has to have a
# non-blank base name and must not exceed Constants::FILENAME_MAX_LENGTH.
# Both checks run, so both errors can be added at once.
def wopi_filename_valid
  # Check that filename without extension is not blank
  # NOTE(review): the last five characters are cut off, which presumes a
  # dot plus a four-letter extension - confirm against the callers
  if file_name[0..-6].blank?
    errors.add(
      :file,
      I18n.t('general.text.not_blank')
    )
  end

  # Check maximum filename length
  return unless file_name.length > Constants::FILENAME_MAX_LENGTH

  errors.add(
    :file,
    I18n.t(
      'general.file.file_name_too_long',
      limit: Constants::FILENAME_MAX_LENGTH
    )
  )
end
2016-02-12 23:52:43 +08:00
end