Class: Ameblogazo::Gazo

Inherits:

Object

Object
Ameblogazo::Gazo

show all

Defined in: lib/ameblogazo.rb

Defined Under Namespace

Classes: Driver, GazoException, SeleniumDriver, WebkitDriver

Instance Method Summary collapse

#_check_options(options) ⇒ Object

オプションチェック.
#_find_image_url(ameba_id) ⇒ Object

一番最初の画像のURLを取得する.
#_get_info(dir, categorize) ⇒ Object

ダウンロード対象のURLや保存先を取得.
#_init_driver(selenium) ⇒ Object

driver初期化.
#_next_page ⇒ Object

次にダウンロードするべき画像を開く.
#_save_img(url, file) ⇒ Object

画像をダウンロードして保存.
#fetch(options) ⇒ Object

画像を保存する。オプション: :ameba_id => アメーバID、:dir => 保存先ディレクトリ、:categorize => タイトル毎などに分類する（デフォルト無効。nil, "title", "date" のいずれか）、:num => 取得する枚数（新しいものから順番に）。
#info(options) ⇒ Object

画像の情報を取得する.

Instance Method Details

#_check_options(options) ⇒ `Object`

オプションチェック

# File 'lib/ameblogazo.rb', line 33

# Validates the options hash given to #fetch / #info and normalizes :num.
#
# The hash is modified in place: a valid :num is replaced by its Integer
# value. Nothing is modified when validation fails.
#
# @param options [Hash] caller options; :dir is required, :num is optional
# @return [Hash] the same hash object, with :num converted when present
# @raise [GazoException] if options is not a Hash, if :dir is nil, or if
#   :num (after to_s) is not made up solely of decimal digits
def _check_options(options)
  unless options.is_a?(Hash)
    raise GazoException, "オプションがnil、もしくはハッシュじゃないです"
  end
  if options[:dir].nil?
    raise GazoException, "ディレクトリ(:dir)を指定してください"
  end
  if options[:num]
    num = options[:num].to_s
    # \A and \z anchor the whole string. ^ and $ only anchor one line, so a
    # value such as "1\nabc" would otherwise be accepted as numeric.
    unless /\A\d+\z/ =~ num
      raise GazoException, "数値じゃないです"
    end
    options[:num] = num.to_i
  end
  options
end

#_find_image_url(ameba_id) ⇒ `Object`

一番最初の画像のURLを取得する

# File 'lib/ameblogazo.rb', line 61

# Finds the URL of the first image page linked from a blog's entry pages.
#
# Fetches http://ameblo.jp/<ameba_id>/page-N.html for N = 1..100, pausing
# 0.1s between pages, and returns the first link whose href matches the
# image page pattern.
#
# @param ameba_id [String] Ameba blog ID
# @return [String] href of the first matching image page
# @raise [GazoException] if a page cannot be opened, if the page body has
#   class "sorry" (treated as an unknown ID), or if no image link is found
def _find_image_url(ameba_id)
  puts "検索中..."
  # Escape the ID and the literal dots so they match only themselves.
  image_link = %r{http://ameblo\.jp/#{Regexp.escape(ameba_id.to_s)}/image-\d{11}-\d{11}\.html}

  1.upto(100) do |page|
    url = "http://ameblo.jp/#{ameba_id}/page-#{page}.html"
    begin
      # URI.open is required here: Kernel#open stopped handling URLs in Ruby 3.0.
      html = URI.open(url)
    rescue
      raise GazoException, "画像が見つからなかったです"
    end
    begin
      doc = Nokogiri::HTML(html)
    ensure
      html.close
    end

    # Check that ameba_id refers to an existing blog
    sorry = doc.xpath("//body[@class='sorry']")
    unless sorry.empty?
      raise GazoException, "存在しないIDです"
    end

    doc.xpath("//a").each do |node|
      href = node[:href]
      return href if image_link =~ href
    end
    sleep(0.1)
  end

  # No page within the limit contained an image link
  raise GazoException, "画像がみつからなかったです"
end

#_get_info(dir, categorize) ⇒ `Object`

ダウンロード対象のURLや保存先を取得

# File 'lib/ameblogazo.rb', line 99

# Collects the download URL and destination path for the image currently
# shown by @driver, creating the destination directory when it is missing.
#
# @param dir [String] base directory to save into
# @param categorize [String, nil] "title" or "date" to save into a
#   subdirectory named after the entry title or the 8-digit run found in
#   the image URL; any other value saves directly into dir
# @return [Hash] :url (image src), :file (destination path), :title
#   (entry title as shown on the page), :date (8-digit string or nil)
def _get_info(dir, categorize)
  img = @driver.find(:xpath, '//img[@id="imgItem"]')
  download_url = img[:src]
  filename = File.basename(download_url)
  title = @driver.find("#entryLink").text
  date = download_url[/\d{8}/]

  # Categorize by title or date
  if categorize == "title"
    # The title comes from the remote page, so it must not be able to add
    # path components or climb out of dir.
    folder = title.to_s.gsub(%r{[/\\\x00]}, "_")
    folder = folder.tr(".", "_") if folder == "." || folder == ".."
    dir = "#{dir}/#{folder}"
  elsif categorize == "date"
    if date
      dir = "#{dir}/#{date}"
    else
      puts "うまく日付がとれなかったのでカテゴライズせずに保存します"
    end
  end

  # Create the directory if it does not exist yet
  unless File.directory?(dir)
    print "ディレクトリを作成します #{dir}\n"
    FileUtils.mkdir_p(dir)
  end
  download_file = "#{dir}/#{filename}"
  {:url=>download_url, :file=>download_file, :title=>title, :date=>date}
end

#_init_driver(selenium) ⇒ `Object`

driver初期化

# File 'lib/ameblogazo.rb', line 52

# Creates the browser driver and stores it in @driver.
#
# @param selenium [Object] truthy selects SeleniumDriver, falsy selects
#   WebkitDriver
# @return [Object] the newly created driver
def _init_driver(selenium)
  driver_class = selenium ? SeleniumDriver : WebkitDriver
  @driver = driver_class.new
end

#_next_page ⇒ `Object`

次にダウンロードするべき画像を開く



127
128
129

# File 'lib/ameblogazo.rb', line 127

# Moves the browser to the next image to download by clicking the element
# matched by "#nextNavi".
#
# @return [Object] whatever the driver element's click returns
def _next_page
  next_link = @driver.find("#nextNavi")
  next_link.click
end

#_save_img(url, file) ⇒ `Object`

画像をダウンロードして保存

# File 'lib/ameblogazo.rb', line 132

# Downloads an image and writes it to a local file, then prints the saved
# file name.
#
# @param url [String] location of the image to download
# @param file [String] destination path; an existing file is overwritten
# @return [nil]
def _save_img(url, file)
  # URI.open is required here: Kernel#open stopped handling URLs in Ruby 3.0.
  URI.open(url) do |remote|
    # Binary mode keeps image bytes intact on platforms that translate
    # newlines in text mode.
    File.open(file, 'wb') do |fp|
      # Stream the body instead of loading it fully into memory
      IO.copy_stream(remote, fp)
    end
  end
  filename = File.basename(file)
  puts "#{filename} を保存しました"
end

#fetch(options) ⇒ `Object`

画像を保存する。オプション: :ameba_id => アメーバID、:dir => 保存先ディレクトリ、:categorize => タイトル毎などに分類する（デフォルト無効。nil, "title", "date" のいずれか）、:num => 取得する枚数（新しいものから順番に）。

# File 'lib/ameblogazo.rb', line 147

# Downloads images from a blog, starting at the first image found and
# following the "next" link, pausing 0.5s between images.
#
# Options read here: :ameba_id, :dir, :categorize, :num, :selenium.
# With :num set, exactly that many images are visited and files that
# already exist are skipped. Without :num, the run stops at the first file
# that already exists.
#
# @param options [Hash] see above; validated by _check_options
# @return [nil]
# @raise [GazoException] when the options are invalid or no image is found
def fetch(options)
  options = _check_options(options)
  ameba_id = options[:ameba_id]
  categorize = options[:categorize]
  dir = options[:dir]
  num = options[:num]

  # Initialize the driver
  _init_driver(options[:selenium])

  # Go to the image page
  @driver.visit(_find_image_url(ameba_id))

  # Walk from the first image found to the next one, in order
  info_list = []
  loop.with_index do |_, i|
    break if i == num # stop after the requested number of images
    info = _get_info(dir, categorize)
    # Stop when the current file is the first one collected again
    # (presumably the gallery has wrapped around)
    break if info_list[0] && info_list[0][:file] == info[:file]
    info_list.push(info)

    # File.exist? replaces File.exists?, which was removed in Ruby 3.2
    if File.exist?(info[:file])
      if num
        puts "既にダウンロードされている画像です"
      else
        puts "ダウンロード済みの画像が見つかったので終了します"
        break
      end
    else
      _save_img(info[:url], info[:file])
    end
    _next_page
    sleep(0.5)
  end
end

#info(options) ⇒ `Object`

画像の情報を取得する

# File 'lib/ameblogazo.rb', line 184

# Collects information about a blog's images without downloading them.
#
# Starts at the first image found and follows the "next" link, pausing
# 0.5s between images, until :num entries are collected or the current
# file equals the first one collected.
#
# @param options [Hash] same keys as #fetch; validated by _check_options
# @return [Array<Hash>] one _get_info result per image visited
# @raise [GazoException] when the options are invalid or no image is found
def info(options)
  opts = _check_options(options)
  limit = opts[:num]
  target_dir = opts[:dir]
  grouping = opts[:categorize]

  # Set up the driver and open the first image page
  _init_driver(opts[:selenium])
  @driver.visit(_find_image_url(opts[:ameba_id]))

  collected = []
  visited = 0
  loop do
    break if visited == limit # requested number of images reached
    entry = _get_info(target_dir, grouping)
    first = collected.first
    break if first && first[:file] == entry[:file]
    collected << entry
    _next_page
    sleep(0.5)
    visited += 1
  end
  collected
end

Class: Ameblogazo::Gazo

Defined Under Namespace

Instance Method Summary collapse

Instance Method Details

#_check_options(options) ⇒ Object

#_find_image_url(ameba_id) ⇒ Object

#_get_info(dir, categorize) ⇒ Object

#_init_driver(selenium) ⇒ Object

#_next_page ⇒ Object

#_save_img(url, file) ⇒ Object

#fetch(options) ⇒ Object

#info(options) ⇒ Object