Module: LogStash::Util::FileTools

Extended by:
FileTools
Included in:
FileTools
Defined in:
lib/logstash/util/filetools.rb

Instance Method Summary collapse

Instance Method Details

#do_ungz(file) ⇒ Object

Decompresses a single gzip file in place: writes the uncompressed output next to the input and deletes the original .gz file.

[View source]

128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
# File 'lib/logstash/util/filetools.rb', line 128

# Decompress a gzip file to a sibling path with the ".gz" suffix removed,
# then delete the compressed original. On failure the partial output is
# removed and the exception is re-raised; the input file is left intact.
#
# @param file [String] path to a ".gz" file
def do_ungz(file)
  # Strip only a *trailing* ".gz" — the old gsub removed every ".gz"
  # occurrence, which could mangle names like "a.gz.tar".
  outpath = file.sub(/\.gz$/, '')
  tgz = Zlib::GzipReader.new(File.open(file, "rb"))
  begin
    File.open(outpath, "wb") do |out|
      IO::copy_stream(tgz, out)
    end
    File.unlink(file)
  rescue
    # Clean up the partial output, then propagate the original error.
    File.unlink(outpath) if File.file?(outpath)
    raise
  ensure
    # Close the reader on every path; previously it leaked on exceptions.
    tgz.close
  end
end

#download(url, output) ⇒ Object

[View source]

49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
# File 'lib/logstash/util/filetools.rb', line 49

# Stream +url+ to +output+ via a ".tmp" file, showing percentage progress
# on a TTY, and return the SHA1 hex digest of the downloaded bytes.
# The tmp file is removed on failure; on success it is renamed into place.
#
# @param url [String] HTTP(S) URL to fetch
# @param output [String] destination path
# @return [String] SHA1 hexdigest of the body
# @raise [RuntimeError] when the server does not answer 200 or 301
def download(url, output)
  uri = URI(url)
  digest = Digest::SHA1.new
  tmp = "#{output}.tmp"
  Net::HTTP.start(uri.host, uri.port, :use_ssl => (uri.scheme == "https")) do |http|
    request = Net::HTTP::Get.new(uri.path)
    http.request(request) do |response|
      # Net::HTTP reports the status as a String ("200"), so the original
      # Integer comparison never matched — and the condition was inverted,
      # failing on success codes. Fail unless the response looks OK.
      fail "HTTP fetch failed for #{url}. #{response}" unless %w[200 301].include?(response.code)
      # -1 sentinel when Content-Length is absent (to_i never returns nil,
      # so the old `to_i || -1` could never take the fallback).
      size = (response["content-length"] || -1).to_f
      count = 0
      File.open(tmp, "wb") do |fd|
        response.read_body do |chunk|
          fd.write(chunk)
          digest << chunk
          if size > 0 && $stdout.tty?
            count += chunk.bytesize
            $stdout.write(sprintf("\r%0.2f%%", count/size * 100))
          end
        end
      end
      # Clear the progress line.
      $stdout.write("\r      \r") if $stdout.tty?
    end
  end

  File.rename(tmp, output)

  return digest.hexdigest
rescue SocketError => e
  puts "Failure while downloading #{url}: #{e}"
  raise
ensure
  # Remove any partial download (rename already happened on success).
  File.unlink(tmp) if File.exist?(tmp)
end

#eval_file(entry, files, prefix) ⇒ Object

[View source]

144
145
146
147
148
149
150
151
152
153
154
155
156
157
# File 'lib/logstash/util/filetools.rb', line 144

# Decide the output name for a tar +entry+, or return false to skip it.
#
# @param entry [#full_name] tar entry
# @param files [Array<String>, String, nil] whitelist of names, a regexp
#   source string, or nil to accept everything
# @param prefix [String] leading path component to strip
# @return [String, false, nil] relative output name, or false/nil to skip
def eval_file(entry, files, prefix)
  name = entry.full_name
  # PaxHeaders entries are tar metadata, never real files.
  return false if name =~ /PaxHeaders/
  case files
  when nil
    # No filter: keep the entry, minus the archive prefix.
    name.gsub(prefix, '')
  when Array
    # Explicit whitelist of prefix-stripped names; keep basename only.
    files.include?(name.gsub(prefix, '')) ? name.split("/").last : false
  when String
    # Treat the string as a regexp over the full entry name.
    name =~ Regexp.new(files) ? name.split("/").last : false
  end
end

#fetch(url, sha1, output) ⇒ Object

[View source]

10
11
12
13
14
15
16
17
18
# File 'lib/logstash/util/filetools.rb', line 10

# Download +url+ to +output+ and verify the result against the expected
# SHA1 checksum, failing loudly on a mismatch.
#
# @param url [String] URL to download
# @param sha1 [String] expected SHA1 hexdigest
# @param output [String] destination path
# @raise [RuntimeError] when the checksum does not match
def fetch(url, sha1, output)
  puts "Downloading #{url}"
  computed = download(url, output)
  return if computed == sha1
  fail "SHA1 does not match (expected '#{sha1}' but got '#{computed}')"
end

#file_fetch(url, sha1, target) ⇒ Object

Fetches a URL into the target directory, skipping the download when an existing file already matches the expected SHA1.

[View source]

20
21
22
23
24
25
26
27
28
29
30
31
32
# File 'lib/logstash/util/filetools.rb', line 20

# Fetch +url+ into +target+, reusing an existing file when its SHA1 already
# matches; otherwise (missing or stale) download it via #fetch.
#
# @param url [String] URL whose basename names the local file
# @param sha1 [String] expected SHA1 hexdigest
# @param target [String] destination directory
# @return [String] path of the fetched file
def file_fetch(url, sha1, target)
  filename = File.basename( URI(url).path )
  # Interpolate the computed basename (the original string was garbled and
  # never used +filename+ at all).
  output = "#{target}/#{filename}"
  begin
    actual_sha1 = file_sha1(output)
    # Stale or corrupt local copy: re-download.
    if actual_sha1 != sha1
      fetch(url, sha1, output)
    end
  rescue Errno::ENOENT
    # No local copy yet.
    fetch(url, sha1, output)
  end
  return output
end

#file_sha1(path) ⇒ Object

[View source]

34
35
36
37
38
39
40
41
42
43
44
45
46
47
# File 'lib/logstash/util/filetools.rb', line 34

# Compute the SHA1 hexdigest of the file at +path+.
#
# Digest.file streams the file in fixed-size chunks, replacing the
# hand-rolled sysread/EOFError loop; like File.new, it raises
# Errno::ENOENT when the file is missing (callers rely on that).
#
# @param path [String] file to hash
# @return [String] SHA1 hexdigest
# @raise [Errno::ENOENT] when +path+ does not exist
def file_sha1(path)
  Digest::SHA1.file(path).hexdigest
end

#process_downloads(files, target = '') ⇒ Object

[View source]

159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
# File 'lib/logstash/util/filetools.rb', line 159

# Fetch each described file into +target+ and unpack it according to its
# extension: ".tar.gz"/".tgz" are untarred (entries filtered through
# #eval_file), bare ".gz" files are gunzipped in place.
#
# @param files [Array<Hash>] each with 'url', 'sha1', and optional 'files'
# @param target [String] destination directory (created if absent)
def process_downloads(files, target = '')

  FileUtils.mkdir_p(target) unless File.directory?(target)

  files.each do |file|
    download = file_fetch(file['url'], file['sha1'], target)

    # Anchored, escaped patterns: the original /.tar.gz/ etc. left the dots
    # unescaped and unanchored, so unrelated names could be misclassified.
    if download =~ /\.tar\.gz$/
      extension = '.tar.gz'
    elsif download =~ /\.tgz$/
      extension = '.tgz'
    elsif download =~ /\.gz$/
      do_ungz(download)
      next
    else
      next
    end

    # Archive prefix = basename without extension (and without target dir).
    prefix = download.gsub(extension, '').gsub("#{target}/", '')
    untar(download) do |entry|
      next unless out = eval_file(entry, file['files'], prefix)
      File.join(target, out)
    end
  end
end

#untar(tarball, &block) ⇒ Object

Extracts a gzipped tarball; the block maps each tar entry to its output path (or nil to skip the entry).

[View source]

83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
# File 'lib/logstash/util/filetools.rb', line 83

# Extract a gzipped tarball. The block receives each tar entry and returns
# the output path for it, or nil to skip. Unchanged files (same size and
# mode) are not rewritten; the tarball is deleted after extraction.
#
# @param tarball [String] path to a .tar.gz/.tgz archive
# @yieldparam entry [Archive::Tar::Minitar entry]
# @yieldreturn [String, nil] destination path, or nil to skip
def untar(tarball, &block)
  require "archive/tar/minitar"
  # Binary mode: tar data must not be newline-translated on Windows.
  tgz = Zlib::GzipReader.new(File.open(tarball, "rb"))
  # Pull out typesdb
  tar = Archive::Tar::Minitar::Input.open(tgz)
  tar.each do |entry|
    path = block.call(entry)
    next if path.nil?
    parent = File.dirname(path)

    FileUtils.mkdir_p(parent) unless File.directory?(parent)

    # Skip this file if the output file is the same size
    if entry.directory?
      FileUtils.mkdir_p(path) unless File.directory?(path)
    else
      entry_mode = entry.instance_eval { @mode } & 0777
      # File.exists? was removed in Ruby 3.2; File.exist? is the supported form.
      if File.exist?(path)
        stat = File.stat(path)
        # TODO(sissel): Submit a patch to archive-tar-minitar upstream to
        # expose headers in the entry.
        entry_size = entry.instance_eval { @size }
        # If file sizes are same, skip writing.
        next if stat.size == entry_size && (stat.mode & 0777) == entry_mode
      end
      puts "Extracting #{entry.full_name} from #{tarball} #{entry_mode.to_s(8)}"
      File.open(path, "wb") do |fd|
        # eof? check lets us skip empty files. Necessary because the API provided by
        # Archive::Tar::Minitar::Reader::EntryStream only mostly acts like an
        # IO object. Something about empty files in this EntryStream causes
        # IO.copy_stream to throw "can't convert nil into String" on JRuby
        # TODO(sissel): File a bug about this.
        while !entry.eof?
          chunk = entry.read(16384)
          fd.write(chunk)
        end
          #IO.copy_stream(entry, fd)
      end
      File.chmod(entry_mode, path)
    end
  end
  tar.close
  File.unlink(tarball) if File.file?(tarball)
end