Class: Sitemap

Inherits:
Object
  • Object
show all
Defined in:
lib/sitemap.rb

Instance Method Summary collapse

Constructor Details

#initialize(uri) ⇒ Sitemap

Returns a new instance of Sitemap.



6
7
8
# File 'lib/sitemap.rb', line 6

def initialize(uri)
  @uri = uri
end

Instance Method Details

#each(&block) ⇒ Object



10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
# File 'lib/sitemap.rb', line 10

def each(&block)
  sitemap = open(@uri) do |f|
    f = Zlib::GzipReader.new(f) if @uri =~ /\.gz\Z/
    Nokogiri::XML(f)
  end

  case sitemap.root.name
  when "urlset"
    sitemap.xpath("/s:urlset/s:url/s:loc", namespaces).each do |element|
      yield element.text
    end
  when "sitemapindex"
    sitemap.xpath("/s:sitemapindex/s:sitemap/s:loc", namespaces).each do |element|
      Sitemap.new(element.text).each(&block)
    end
  else
    raise "Unknown sitemap format"
  end
end

#namespacesObject



30
31
32
# File 'lib/sitemap.rb', line 30

def namespaces
  { "s" => "http://www.sitemaps.org/schemas/sitemap/0.9" }
end