Class: Aspera::Cli::Plugins::Preview
- Inherits:
-
BasicAuthPlugin
- Object
- Aspera::Cli::Plugin
- BasicAuthPlugin
- Aspera::Cli::Plugins::Preview
- Defined in:
- lib/aspera/cli/plugins/preview.rb
Constant Summary collapse
- ACTIONS =
%i[scan events trevents check test].freeze
Constants inherited from Aspera::Cli::Plugin
Aspera::Cli::Plugin::ALL_OPS, Aspera::Cli::Plugin::GLOBAL_OPS, Aspera::Cli::Plugin::INSTANCE_OPS, Aspera::Cli::Plugin::MAX_ITEMS, Aspera::Cli::Plugin::MAX_PAGES, Aspera::Cli::Plugin::REGEX_LOOKUP_ID_BY_FIELD, Aspera::Cli::Plugin::VAL_ALL
Instance Attribute Summary collapse
-
#option_file_access ⇒ Object
Returns the value of attribute option_file_access.
-
#option_folder_reset_cache ⇒ Object
Returns the value of attribute option_folder_reset_cache.
-
#option_overwrite ⇒ Object
Returns the value of attribute option_overwrite.
-
#option_previews_folder ⇒ Object
Returns the value of attribute option_previews_folder (note: option_skip_format has special accessors).
-
#option_skip_folders ⇒ Object
Returns the value of attribute option_skip_folders.
Instance Method Summary collapse
- #do_transfer(direction, folder_id, source_filename, destination = '/') ⇒ Object
-
#entry_preview_folder_name(entry) ⇒ Object
defined by node api.
- #execute_action ⇒ Object
-
#generate_preview(entry) ⇒ Object
Generate preview files for one folder entry (file) if necessary. The entry must contain “parent_file_id” if remote.
-
#get_folder_entries(file_id, request_args = nil) ⇒ Object
/files/id/files is normally cached in redis (but the cache can be discarded), whereas /files/id is not cached.
- #get_infos_local(gen_infos, entry) ⇒ Object
- #get_infos_remote(gen_infos, entry) ⇒ Object
-
#initialize(env) ⇒ Preview
constructor
A new instance of Preview.
- #option_skip_format ⇒ Object
- #option_skip_format=(value) ⇒ Object
- #option_skip_types ⇒ Object
- #option_skip_types=(value) ⇒ Object
- #preview_filename(preview_format, filename = nil) ⇒ Object
-
#process_events(iteration_persistency) ⇒ Object
requests recent events on node api and process newly modified folders.
-
#process_trevents(iteration_persistency) ⇒ Object
old version based on folders.
-
#scan_folder_files(top_entry, scan_start = nil) ⇒ Object
scan all files in provided folder entry.
Methods inherited from BasicAuthPlugin
#basic_auth_api, #basic_auth_params, register_options
Methods inherited from Aspera::Cli::Plugin
#do_bulk_operation, #entity_action, #entity_command, #instance_identifier, #old_query_read_delete, #query_read_delete, #value_create_modify, #value_or_query
Constructor Details
#initialize(env) ⇒ Preview
Returns a new instance of Preview.
46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 |
# File 'lib/aspera/cli/plugins/preview.rb', line 46
# Build the plugin: set generation defaults, declare the command line options,
# parse them and prepare a private temporary work folder.
#
# NOTE(review): the receiver `options`, the call `parse_options!`, the variable
# name `@gen_options` and the `%` of the `%i[...]` literals were missing from the
# listing; they are reconstructed from how the remaining code uses them. Confirm
# against the original source file.
#
# @param env [Object] plugin environment, forwarded unchanged to the parent constructor
# @raise [RuntimeError] if option `skip_folders` is not an Array
def initialize(env)
  super(env)
  @skip_types = []
  @default_transfer_spec = nil
  # by default generate all supported formats (clone, as altered by options)
  @preview_formats_to_generate = Aspera::Preview::Generator::PREVIEW_FORMATS.clone
  # options for generation
  @gen_options = Aspera::Preview::Options.new
  # used to trigger periodic processing
  @periodic = TimerLimiter.new(LOG_LIMITER_SEC)
  # link CLI options to gen_info attributes
  options.declare(
    :skip_format, 'Skip this preview format (multiple possible)', values: Aspera::Preview::Generator::PREVIEW_FORMATS,
    handler: {o: self, m: :option_skip_format}, default: [])
  options.declare(
    :folder_reset_cache, 'Force detection of generated preview by refresh cache', values: %i[no header read],
    handler: {o: self, m: :option_folder_reset_cache}, default: :no)
  options.declare(:skip_types, 'Skip types in comma separated list', handler: {o: self, m: :option_skip_types})
  options.declare(:previews_folder, 'Preview folder in storage root', handler: {o: self, m: :option_previews_folder}, default: DEFAULT_PREVIEWS_FOLDER)
  options.declare(:temp_folder, 'Path to temp folder', default: Dir.tmpdir)
  options.declare(:skip_folders, 'List of folder to skip', handler: {o: self, m: :option_skip_folders}, default: [])
  # help text fixed: it used to read "for for test"
  options.declare(:case, 'Basename of output for test')
  options.declare(:scan_path, 'Subpath in folder id to start scan in (default=/)')
  options.declare(:scan_id, 'Folder id in storage to start scan in, default is access key main folder id')
  options.declare(:mimemagic, 'Use Mime type detection of gem mimemagic', values: :bool, default: false)
  options.declare(:overwrite, 'When to overwrite result file', values: %i[always never mtime], handler: {o: self, m: :option_overwrite}, default: :mtime)
  options.declare(
    :file_access, 'How to read and write files in repository', values: %i[local remote],
    handler: {o: self, m: :option_file_access}, default: :local)
  # add other options for generator (and set default values)
  Aspera::Preview::Options::DESCRIPTIONS.each do |opt|
    # explicit value list wins; otherwise a boolean default makes it a boolean option; else no restriction (nil)
    values =
      if opt.key?(:values)
        opt[:values]
      elsif Cli::Manager::BOOLEAN_SIMPLE.include?(opt[:default])
        :bool
      end
    options.declare(opt[:name], opt[:description].capitalize, values: values, handler: {o: @gen_options, m: opt[:name]}, default: opt[:default])
  end
  options.parse_options!
  raise 'skip_folder shall be an Array, use @json:[...]' unless @option_skip_folders.is_a?(Array)
  # unique sub folder, so that cleanup only removes what this run created
  @tmp_folder = File.join(options.get_option(:temp_folder, mandatory: true), "#{TMP_DIR_PREFIX}.#{SecureRandom.uuid}")
  FileUtils.mkdir_p(@tmp_folder)
  Log.log.debug{"tmpdir: #{@tmp_folder}"}
end
Instance Attribute Details
#option_file_access ⇒ Object
Returns the value of attribute option_file_access.
44 45 46 |
# File 'lib/aspera/cli/plugins/preview.rb', line 44
# Reader for the `file_access` option.
# @return [Object] the value currently stored in `@option_file_access`
def option_file_access
  @option_file_access
end
#option_folder_reset_cache ⇒ Object
Returns the value of attribute option_folder_reset_cache.
44 45 46 |
# File 'lib/aspera/cli/plugins/preview.rb', line 44
# Reader for the `folder_reset_cache` option.
# @return [Object] the value currently stored in `@option_folder_reset_cache`
def option_folder_reset_cache
  @option_folder_reset_cache
end
#option_overwrite ⇒ Object
Returns the value of attribute option_overwrite.
44 45 46 |
# File 'lib/aspera/cli/plugins/preview.rb', line 44
# Reader for the `overwrite` option.
# @return [Object] the value currently stored in `@option_overwrite`
def option_overwrite
  @option_overwrite
end
#option_previews_folder ⇒ Object
Returns the value of attribute option_previews_folder (note: option_skip_format has special accessors)
43 44 45 |
# File 'lib/aspera/cli/plugins/preview.rb', line 43
# Reader for the `previews_folder` option.
# @return [Object] the value currently stored in `@option_previews_folder`
def option_previews_folder
  @option_previews_folder
end
#option_skip_folders ⇒ Object
Returns the value of attribute option_skip_folders.
44 45 46 |
# File 'lib/aspera/cli/plugins/preview.rb', line 44
# Reader for the `skip_folders` option.
# @return [Object] the value currently stored in `@option_skip_folders`
def option_skip_folders
  @option_skip_folders
end
Instance Method Details
#do_transfer(direction, folder_id, source_filename, destination = '/') ⇒ Object
207 208 209 210 211 212 213 214 215 216 |
# File 'lib/aspera/cli/plugins/preview.rb', line 207
# Transfer one source path from/to a folder of the node, tagging the transfer
# with PREV_GEN_TAG.
#
# @param direction [Object] transfer direction, compared with Fasp::TransferSpec::DIRECTION_RECEIVE
# @param folder_id [Object] folder identifier given to `transfer_spec_gen4`
# @param source_filename [String] value of the single `source` path of the transfer
# @param destination [String] destination root forced on the transfer agent
# @return [Object] whatever `Main.result_transfer` returns
# @raise [RuntimeError] when receiving with a nil destination
def do_transfer(direction, folder_id, source_filename, destination='/')
  raise 'Internal ERROR' if destination.nil? && direction.eql?(Fasp::TransferSpec::DIRECTION_RECEIVE)
  t_spec = @api_node.transfer_spec_gen4(folder_id, direction, {
    'paths' => [{'source' => source_filename}],
    'tags'  => {Fasp::TransferSpec::TAG_RESERVED => {PREV_GEN_TAG => true}}
  })
  # force destination, need to set this in transfer agent else it gets overwritten, not do: t_spec['destination_root']=destination
  transfer.option_transfer_spec_deep_merge({'destination_root' => destination})
  Main.result_transfer(transfer.start(t_spec))
end
#entry_preview_folder_name(entry) ⇒ Object
defined by node api
254 255 256 |
# File 'lib/aspera/cli/plugins/preview.rb', line 254
# Name of the folder holding the previews of one entry: the entry id followed
# by PREVIEW_FOLDER_SUFFIX (naming defined by node api).
#
# @param entry [Hash] file entry, only key 'id' is read
# @return [String] preview folder name for this entry
def entry_preview_folder_name(entry)
  "#{entry['id']}#{PREVIEW_FOLDER_SUFFIX}"
end
#execute_action ⇒ Object
391 392 393 394 395 396 397 398 399 400 401 402 403 404 405 406 407 408 409 410 411 412 413 414 415 416 417 418 419 420 421 422 423 424 425 426 427 428 429 430 431 432 433 434 435 436 437 438 439 440 441 442 443 444 445 446 447 448 449 450 451 452 453 454 455 456 457 458 459 460 461 462 463 464 465 466 467 468 469 470 471 472 473 474 475 476 477 478 479 480 481 482 483 484 485 486 487 488 |
# File 'lib/aspera/cli/plugins/preview.rb', line 391
# Entry point of the plugin: read the next command from the command line,
# prepare access to the node (except for `check` and `test`), run the command
# and always remove the temporary folder afterwards.
#
# NOTE(review): the receiver `options`, the variable name `@gen_options` and the
# `%` of the `%i[...]` literal were missing from the listing and are
# reconstructed from usage. Confirm against the original source file.
#
# @return [Object] result built by `Main.result_status`
# @raise [CliError] when a required folder does not exist
# @raise [RuntimeError] on storage type mismatch, access key mismatch or unsupported test input
def execute_action
  command = options.get_next_command(ACTIONS)
  unless %i[check test].include?(command)
    # this will use node api
    @api_node = Aspera::Node.new(params: basic_auth_params)
    @transfer_server_address = URI.parse(@api_node.params[:base_url]).host
    # get current access key
    @access_key_self = @api_node.read('access_keys/self')[:data]
    # TODO: check events is activated here:
    # note that docroot is good to look at as well
    node_info = @api_node.read('info')[:data]
    Log.log.debug{"root: #{node_info['docroot']}"}
    @access_remote = @option_file_access.eql?(:remote)
    Log.log.debug{"remote: #{@access_remote}"}
    Log.log.debug{"access key info: #{@access_key_self}"}
    # TODO: can the previews folder parameter be read from node api ?
    @option_skip_folders.push('/' + @option_previews_folder)
    if @access_remote
      # NOTE: the filter "name", it's why we take the first one
      @previews_folder_entry = get_folder_entries(@access_key_self['root_file_id'], {name: @option_previews_folder}).first
      raise CliError, "Folder #{@option_previews_folder} does not exist on node. "\
        'Please create it in the storage root, or specify an alternate name.' if @previews_folder_entry.nil?
    else
      raise 'only local storage allowed in this mode' unless @access_key_self['storage']['type'].eql?('local')
      @local_storage_root = @access_key_self['storage']['path']
      # TODO: option to override @local_storage_root='xxx'
      @local_storage_root = @local_storage_root[PVCL_LOCAL_STORAGE.length..-1] if @local_storage_root.start_with?(PVCL_LOCAL_STORAGE)
      # TODO: windows could have "C:" ?
      raise "not local storage: #{@local_storage_root}" unless @local_storage_root.start_with?('/')
      raise CliError, "Local storage root folder #{@local_storage_root} does not exist." unless File.directory?(@local_storage_root)
      @local_preview_folder = File.join(@local_storage_root, @option_previews_folder)
      raise CliError, "Folder #{@local_preview_folder} does not exist locally. "\
        'Please create it, or specify an alternate name.' unless File.directory?(@local_preview_folder)
      # protection to avoid clash of file id for two different access keys
      marker_file = File.join(@local_preview_folder, AK_MARKER_FILE)
      Log.log.debug{"marker file: #{marker_file}"}
      if File.exist?(marker_file)
        ak = File.read(marker_file).chomp
        raise "mismatch access key in #{marker_file}: contains #{ak}, using #{@access_key_self['id']}" unless @access_key_self['id'].eql?(ak)
      else
        File.write(marker_file, @access_key_self['id'])
      end
    end
  end
  Aspera::Preview::FileTypes.instance.use_mimemagic = options.get_option(:mimemagic, mandatory: true)
  # check tools that are anyway required for all cases
  Aspera::Preview::Utils.check_tools(@skip_types)
  case command
  when :scan
    scan_path = options.get_option(:scan_path)
    scan_id = options.get_option(:scan_id)
    # by default start at root
    folder_info =
      if scan_id.nil?
        {
          'id'   => @access_key_self['root_file_id'],
          'name' => '/',
          'type' => 'folder',
          'path' => '/'
        }
      else
        @api_node.read("files/#{scan_id}")[:data]
      end
    scan_folder_files(folder_info, scan_path)
    return Main.result_status('scan finished')
  when :events, :trevents
    iteration_persistency = nil
    if options.get_option(:once_only, mandatory: true)
      iteration_persistency = PersistencyActionOnce.new(
        manager: @agents[:persistency],
        data:    [],
        id:      IdGenerator.from_list([
          'preview_iteration',
          command.to_s,
          options.get_option(:url, mandatory: true),
          options.get_option(:username, mandatory: true)
        ]))
    end
    # call processing method specified by command line command
    # (command was validated against ACTIONS, so only process_events/process_trevents are reachable)
    send("process_#{command}", iteration_persistency)
    return Main.result_status("#{command} finished")
  when :check
    return Main.result_status('Tools validated')
  when :test
    format = options.get_next_argument('format', expected: Aspera::Preview::Generator::PREVIEW_FORMATS)
    source = options.get_next_argument('source file')
    dest = preview_filename(format, options.get_option(:case))
    g = Aspera::Preview::Generator.new(@gen_options, source, dest, @tmp_folder, nil)
    raise "cannot find file type for #{source}" if g.conversion_type.nil?
    raise "out format #{format} not supported" unless g.supported?
    g.generate
    return Main.result_status("generated: #{dest}")
  else
    raise 'error'
  end
ensure
  # runs on success and on error
  Log.log.debug{"cleaning up temp folder #{@tmp_folder}"}
  FileUtils.rm_rf(@tmp_folder)
end
#generate_preview(entry) ⇒ Object
Generate preview files for one folder entry (file) if necessary. The entry must contain “parent_file_id” if remote.
265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 |
# File 'lib/aspera/cli/plugins/preview.rb', line 265
# Generate the preview files of one file entry, for each enabled format that
# needs it according to the overwrite policy, the supported conversions and the
# skipped types. Any StandardError is logged and ignored, so that one failing
# entry does not stop the caller.
#
# NOTE(review): the first argument of `Generator.new` was missing from the
# listing; `@gen_options` is reconstructed from usage. Confirm against the
# original source file.
#
# @param entry [Hash] file entry; reads 'id', 'name', 'path', 'content_type',
#   and 'parent_file_id' (mandatory when file access is remote)
# @return [void]
def generate_preview(entry)
  # prepare generic information
  gen_infos = @preview_formats_to_generate.map do |preview_format|
    {
      preview_format: preview_format,
      base_dest:      preview_filename(preview_format)
    }
  end
  # lets gather some infos on possibly existing previews
  # it depends if files access locally or remotely
  # folder where previews will be generated for this particular entry
  local_entry_preview_dir = @access_remote ? get_infos_remote(gen_infos, entry) : get_infos_local(gen_infos, entry)
  # here we have the status on preview files
  # let's find if they need generation
  gen_infos.select! do |gen_info|
    # if it exists, what about overwrite policy ?
    if gen_info[:preview_exist]
      case @option_overwrite
      when :always
        # continue: generate
      when :never
        # never overwrite
        next false
      when :mtime
        # skip if preview is newer than original
        next false if gen_info[:preview_newer_than_original]
      end
    end
    # need generator for further checks
    gen_info[:generator] = Aspera::Preview::Generator.new(@gen_options, gen_info[:src], gen_info[:dst], @tmp_folder, entry['content_type'])
    # get conversion_type (if known) and check if supported
    next false unless gen_info[:generator].supported?
    # shall we skip it ?
    next false if @skip_types.include?(gen_info[:generator].conversion_type)
    # ok we need to generate
    true
  end
  return if gen_infos.empty?
  # create folder if needed
  FileUtils.mkdir_p(local_entry_preview_dir)
  if @access_remote
    raise 'missing parent_file_id in entry' if entry['parent_file_id'].nil?
    # download original file to temp folder
    do_transfer(Fasp::TransferSpec::DIRECTION_RECEIVE, entry['parent_file_id'], entry['name'], @tmp_folder)
  end
  Log.log.info{"source: #{entry['id']}: #{entry['path']}"}
  gen_infos.each do |gen_info|
    begin
      gen_info[:generator].generate
    rescue StandardError => e
      # best effort: a failing format must not prevent the other formats, but leave a trace
      Log.log.warn{"Preview generation failed for #{gen_info[:dst]}: #{e.message}"}
    end
  end
  if @access_remote
    # upload
    do_transfer(Fasp::TransferSpec::DIRECTION_SEND, @previews_folder_entry['id'], local_entry_preview_dir)
    # cleanup after upload
    FileUtils.rm_rf(local_entry_preview_dir)
    File.delete(File.join(@tmp_folder, entry['name']))
  end
  # force read file updated previews
  if @option_folder_reset_cache.eql?(:read)
    @api_node.read("files/#{entry['id']}")
  end
rescue StandardError => e
  Log.log.error{"Ignore: #{e.message}"}
  Log.log.debug(e.backtrace.join("\n").red)
end
#get_folder_entries(file_id, request_args = nil) ⇒ Object
/files/id/files is normally cached in redis (but the cache can be discarded), whereas /files/id is not cached
120 121 122 123 124 125 |
# File 'lib/aspera/cli/plugins/preview.rb', line 120
# List the entries of a folder through `GET files/<id>/files` on the node.
# When option `folder_reset_cache` is `:header`, the request carries
# `X-Aspera-Cache-Control: no-cache`.
#
# @param file_id [Object] folder identifier, interpolated in the sub path
# @param request_args [Hash, nil] passed as `url_params` of the call
# @return [Object] the `:data` part of the call result
def get_folder_entries(file_id, request_args=nil)
  headers = {'Accept' => 'application/json'}
  headers['X-Aspera-Cache-Control'] = 'no-cache' if @option_folder_reset_cache.eql?(:header)
  return @api_node.call({operation: 'GET', subpath: "files/#{file_id}/files", headers: headers, url_params: request_args})[:data]
  # return @api_node.read("files/#{file_id}/files",request_args)[:data]
end
#get_infos_local(gen_infos, entry) ⇒ Object
218 219 220 221 222 223 224 225 226 227 228 229 230 |
# File 'lib/aspera/cli/plugins/preview.rb', line 218
# Fill each generation info with source path, destination path and status of
# an existing preview, when storage is accessed through the local file system.
#
# @param gen_infos [Array<Hash>] one hash per format, each with :base_dest; completed in place
#   with :src, :dst, :preview_exist and :preview_newer_than_original
# @param entry [Hash] file entry; reads 'path' (and what `entry_preview_folder_name` needs)
# @return [String] local folder where previews of this entry are located
def get_infos_local(gen_infos, entry)
  local_original_filepath = File.join(@local_storage_root, entry['path'])
  original_mtime = File.mtime(local_original_filepath)
  # out
  local_entry_preview_dir = File.join(@local_preview_folder, entry_preview_folder_name(entry))
  gen_infos.each do |gen_info|
    gen_info[:src] = local_original_filepath
    gen_info[:dst] = File.join(local_entry_preview_dir, gen_info[:base_dest])
    gen_info[:preview_exist] = File.exist?(gen_info[:dst])
    # mtime of preview is only read when the preview exists
    gen_info[:preview_newer_than_original] = (gen_info[:preview_exist] && (File.mtime(gen_info[:dst]) > original_mtime))
  end
  return local_entry_preview_dir
end
#get_infos_remote(gen_infos, entry) ⇒ Object
232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 |
# File 'lib/aspera/cli/plugins/preview.rb', line 232
# Fill each generation info with source path, destination path and status of
# an existing preview, when storage is accessed remotely: files are located in
# the temporary folder, and existence of a preview is read from node api.
#
# @param gen_infos [Array<Hash>] one hash per format, each with :base_dest; completed in place
#   with :src, :dst, :preview_exist and :preview_newer_than_original
# @param entry [Hash] file entry; reads 'id' and 'name'
# @return [String] folder in the temporary folder where previews of this entry are generated
def get_infos_remote(gen_infos, entry)
  # store source directly here
  local_original_filepath = File.join(@tmp_folder, entry['name'])
  # original_mtime=DateTime.parse(entry['modified_time'])
  # out: where previews are generated
  local_entry_preview_dir = File.join(@tmp_folder, entry_preview_folder_name(entry))
  file_info = @api_node.read("files/#{entry['id']}")[:data]
  # TODO: this does not work because previews is hidden in api (gen4)
  # this_preview_folder_entries=get_folder_entries(@previews_folder_entry['id'],{name: @entry_preview_folder_name})
  # TODO: use gen3 api to list files and get date
  gen_infos.each do |gen_info|
    gen_info[:src] = local_original_filepath
    gen_info[:dst] = File.join(local_entry_preview_dir, gen_info[:base_dest])
    # TODO: use this_preview_folder_entries (but it's hidden)
    gen_info[:preview_exist] = file_info.key?('preview')
    # TODO: get change time and compare, useful ?
    # no date available: an existing preview is considered up to date
    gen_info[:preview_newer_than_original] = gen_info[:preview_exist]
  end
  return local_entry_preview_dir
end
#option_skip_format ⇒ Object
114 115 116 |
# File 'lib/aspera/cli/plugins/preview.rb', line 114
# Reader paired with `option_skip_format=`.
# Note that it lists the formats still to be generated, not the skipped ones.
#
# @return [String] comma separated list of `@preview_formats_to_generate`
def option_skip_format
  return @preview_formats_to_generate.map(&:to_s).join(',')
end
#option_skip_format=(value) ⇒ Object
110 111 112 |
# File 'lib/aspera/cli/plugins/preview.rb', line 110
# Writer for option `skip_format`: remove one format from the list of formats
# to generate. Each call removes one more format.
#
# @param value [Object] format to remove; nothing happens if it is not in the list
def option_skip_format=(value)
  @preview_formats_to_generate.delete(value)
end
#option_skip_types ⇒ Object
106 107 108 |
# File 'lib/aspera/cli/plugins/preview.rb', line 106
# Reader for option `skip_types`.
#
# @return [String] comma separated list of `@skip_types`
def option_skip_types
  return @skip_types.map(&:to_s).join(',')
end
#option_skip_types=(value) ⇒ Object
97 98 99 100 101 102 103 104 |
# File 'lib/aspera/cli/plugins/preview.rb', line 97
# Writer for option `skip_types`: replace the list of skipped conversion types.
# The whole list is validated before assignment, so that `@skip_types` is left
# unchanged when one of the types is rejected.
#
# @param value [String] comma separated list of conversion types
# @raise [RuntimeError] if a type is not in Aspera::Preview::FileTypes::CONVERSION_TYPES
def option_skip_types=(value)
  @skip_types = value.split(',').map do |v|
    s = v.to_sym
    raise "not supported: #{v}" unless Aspera::Preview::FileTypes::CONVERSION_TYPES.include?(s)
    s
  end
end
#preview_filename(preview_format, filename = nil) ⇒ Object
258 259 260 261 |
# File 'lib/aspera/cli/plugins/preview.rb', line 258
# Build the file name of a preview: base name, a dot, then the format.
#
# @param preview_format [Object] preview format, used as file extension
# @param filename [String, nil] base name; PREVIEW_BASENAME is used when nil
# @return [String] preview file name
def preview_filename(preview_format, filename=nil)
  filename ||= PREVIEW_BASENAME
  return "#{filename}.#{preview_format}"
end
#process_events(iteration_persistency) ⇒ Object
requests recent events on node api and process newly modified folders
171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 |
# File 'lib/aspera/cli/plugins/preview.rb', line 171
# Request recent file events on node api and generate previews for files
# reported as created, unless they are located in a skipped folder.
# The identifier of the last processed event is saved periodically in the
# persistency object, if one is provided.
#
# Fix: the same 'file.deleted' test was applied twice, so previews were only
# generated for deleted files; generation is now triggered by 'file.created'.
# NOTE(review): 'file.created' is assumed to be the event type name for a new
# file — confirm against node api documentation.
#
# @param iteration_persistency [Object, nil] object with `data` (Array) and `save`, or nil
# @return [Object, nil] nil when there is no event
def process_events(iteration_persistency)
  # get new file creation by access key (TODO: what if file already existed?)
  events_filter = {
    'access_key' => @access_key_self['id'],
    'type'       => 'file.*'
  }
  # optionally add iteration token from persistency
  events_filter['iteration_token'] = iteration_persistency.data.first unless iteration_persistency.nil?
  events = @api_node.read('events', events_filter)[:data]
  return if events.empty?
  events.each do |event|
    # process only files
    if event.dig('data', 'type').eql?('file')
      # any failure to read the entry means: nothing to process for this event
      file_entry =
        begin
          @api_node.read("files/#{event['data']['id']}")[:data]
        rescue StandardError
          nil
        end
      if !file_entry.nil? && @option_skip_folders.none?{|d|file_entry['path'].start_with?(d)}
        file_entry['parent_file_id'] = event['data']['parent_file_id']
        if event['types'].include?('file.deleted')
          Log.log.error('TODO'.red)
        end
        if event['types'].include?('file.created')
          generate_preview(file_entry)
        end
      end
    end
    # log/persist periodically or last one
    next unless @periodic.trigger? || event.equal?(events.last)
    Log.log.info{"Processing event #{event['id']}"}
    # save checkpoint to avoid losing processing in case of error
    if !iteration_persistency.nil?
      iteration_persistency.data[0] = event['id'].to_s
      iteration_persistency.save
    end
  end
end
#process_trevents(iteration_persistency) ⇒ Object
old version based on folders
129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 |
# File 'lib/aspera/cli/plugins/preview.rb', line 129
# Old version based on folders: request 'download.ended' events on node api
# and scan the destination folder of each successful reception that was not
# started by the preview generator itself (no PREV_GEN_TAG tag).
# The identifier of the last processed event is saved periodically in the
# persistency object, if one is provided.
#
# NOTE(review): the method called on the exception was missing from the listing
# (`e..include?`); `e.message` is reconstructed. Confirm against the original
# source file.
#
# @param iteration_persistency [Object, nil] object with `data` (Array) and `save`, or nil
# @return [Object, nil] nil when there is no event
# @raise [RestCallError] when events cannot be read for another reason than an invalid iteration token
def process_trevents(iteration_persistency)
  events_filter = {
    'access_key' => @access_key_self['id'],
    'type'       => 'download.ended'
  }
  # optionally add iteration token from persistency
  events_filter['iteration_token'] = iteration_persistency.data.first unless iteration_persistency.nil?
  begin
    events = @api_node.read('events', events_filter)[:data]
  rescue RestCallError => e
    if e.message.include?('Invalid iteration_token')
      Log.log.warn{"Retrying without iteration token: #{e}"}
      # token is removed before retrying, so the same request is not sent twice
      events_filter.delete('iteration_token')
      retry
    end
    raise
  end
  return if events.empty?
  events.each do |event|
    if event['data']['direction'].eql?(Fasp::TransferSpec::DIRECTION_RECEIVE) &&
        event['data']['status'].eql?('completed') &&
        event['data']['error_code'].eql?(0) &&
        event['data'].dig('tags', Fasp::TransferSpec::TAG_RESERVED, PREV_GEN_TAG).nil?
      folder_id = event.dig('data', 'tags', Fasp::TransferSpec::TAG_RESERVED, 'node', 'file_id')
      folder_id ||= event.dig('data', 'file_id')
      if !folder_id.nil?
        # any failure to read the folder means: nothing to scan for this event
        folder_entry =
          begin
            @api_node.read("files/#{folder_id}")[:data]
          rescue StandardError
            nil
          end
        scan_folder_files(folder_entry) unless folder_entry.nil?
      end
    end
    # log/persist periodically or last one
    next unless @periodic.trigger? || event.equal?(events.last)
    Log.log.info{"Processed event #{event['id']}"}
    # save checkpoint to avoid losing processing in case of error
    if !iteration_persistency.nil?
      iteration_persistency.data[0] = event['id'].to_s
      iteration_persistency.save
    end
  end
end
#scan_folder_files(top_entry, scan_start = nil) ⇒ Object
scan all files in provided folder entry
332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369 370 371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387 |
# File 'lib/aspera/cli/plugins/preview.rb', line 332
# Scan all files in the provided folder entry, without recursion (a work list
# is used), and generate previews for files accepted by the file filter.
# Links are ignored, folders of the skip list are not entered, and an error on
# one entry is logged without stopping the scan.
#
# Fix: a scan start of '/' used to be made canonical as '//', which matched no
# entry below the root; the trailing slash is now only added when missing.
#
# @param top_entry [Hash] folder entry where scan starts; reads 'id', 'path', 'type'
# @param scan_start [String, nil] sub path to which the scan is restricted, nil for no restriction
# @return [void]
def scan_folder_files(top_entry, scan_start=nil)
  if !scan_start.nil?
    # canonical path: start with / and ends with /
    scan_start = '/' + scan_start.split('/').reject(&:empty?).join('/')
    scan_start = "#{scan_start}/" unless scan_start.end_with?('/')
  end
  filter_block = Aspera::Node.file_matcher(value_or_query(allowed_types: String))
  Log.log.debug{"scan: #{top_entry} : #{scan_start}".green}
  # don't use recursive call, use list instead
  entries_to_process = [top_entry]
  until entries_to_process.empty?
    entry = entries_to_process.shift
    # process this entry only if it is within the scan_start
    entry_path_with_slash = entry['path']
    Log.log.info{"processing entry #{entry_path_with_slash}"} if @periodic.trigger?
    entry_path_with_slash = "#{entry_path_with_slash}/" unless entry_path_with_slash.end_with?('/')
    # keep entries above scan_start (to reach it) and entries below it
    if !scan_start.nil? && !scan_start.start_with?(entry_path_with_slash) && !entry_path_with_slash.start_with?(scan_start)
      Log.log.debug{"#{entry['path']} folder (skip start)".bg_red}
      next
    end
    Log.log.debug{"item:#{entry}"}
    begin
      case entry['type']
      when 'file'
        if filter_block.call(entry)
          generate_preview(entry)
        else
          Log.log.debug('skip by filter')
        end
      when 'link'
        Log.log.debug('Ignoring link.')
      when 'folder'
        if @option_skip_folders.include?(entry['path'])
          Log.log.debug{"#{entry['path']} folder (skip list)".bg_red}
        else
          Log.log.debug{"#{entry['path']} folder".green}
          # get folder content
          folder_entries = get_folder_entries(entry['id'])
          # process all items in current folder
          folder_entries.each do |folder_entry|
            # add path for older versions of ES
            if !folder_entry.key?('path')
              folder_entry['path'] = entry_path_with_slash + folder_entry['name']
            end
            folder_entry['parent_file_id'] = entry['id']
            entries_to_process.push(folder_entry)
          end
        end
      else
        Log.log.warn{"unknown entry type: #{entry['type']}"}
      end
    rescue StandardError => e
      Log.log.warn{"An error occurred: #{e}, ignoring"}
    end
  end
end