Class: ESearchy::SocialEngines::JigSaw
- Inherits: GenericEngine
  - Object
  - GenericEngine
  - ESearchy::SocialEngines::JigSaw
- Defined in:
- lib/esearchy/SocialEngines/jigsaw.rb
Constant Summary collapse
- ENGINE = "www.google.com"
- PORT = 80
- NUM = 100
- TYPE = 2
Instance Attribute Summary
Attributes inherited from GenericEngine
#documents, #emails, #people, #results
Instance Method Summary collapse
Methods inherited from GenericEngine
#company=, #initialize, #maxhits=, #start=
Constructor Details
This class inherits a constructor from ESearchy::GenericEngine
Instance Method Details
#crawl_people(text) ⇒ Object
27 28 29 30 31 32 33 34 35 |
# File 'lib/esearchy/SocialEngines/jigsaw.rb', line 27
#
# Scans a results page for profile anchors (<a class="l" href="...">Name, ...)
# and records every person found.
#
# For each anchor the href and the text before the first comma are captured.
# The name is split on spaces; the pair is appended to @people and a five-element
# row is appended to @results.
#
# @param text [String] HTML of a search-results page
# @return [Array] the raw matches produced by the anchor scan
def crawl_people(text)
  text.scan(/<a class="l" href="([0-9A-Za-z:\\\/?&=@+%.;"'()_-]+)" [\sonmousedown="return curwt(this, ']*[0-9A-Za-z:\\\/?&=@+%.;"'()_-]*[')"]*>([\w\s]*),/).each do |profile|
    pf = profile[0].to_s
    # Redirect-style hrefs ("/url?q=<target>&...") wrap the real link, so unwrap it.
    # Array#to_s only concatenated its elements on Ruby 1.8; on 1.9+ it returns the
    # inspect form (e.g. '[["http://..."]]'), so the captures are joined explicitly.
    pf = pf.scan(/\/url\?q=([0-9A-Za-z:\\\/?=@+%.;"'()_-]+)&/).join if pf.match(/\/url\?q=/)
    # Named name_parts rather than `p` so Kernel#p is not shadowed inside the block.
    name_parts = profile[1].split(" ")
    @people << [name_parts, pf]
    @results << [name_parts, "P", pf, self.class.to_s.upcase, "N"]
  end
end
#parse(html) ⇒ Object
17 18 19 20 21 22 23 24 25 |
# File 'lib/esearchy/SocialEngines/jigsaw.rb', line 17
#
# Reads the total hit count out of a results page and stores it in @totalhits.
#
# The count is taken from a summary line shaped like:
#   Results <b>1</b> - <b>8</b> of <b>8</b> from <b>www.google.com</b>
# When no such line is present @totalhits is set to 0; otherwise thousands
# separators are stripped and the integer is handed to #totalhits (defined
# outside this listing), whose return value is stored.
#
# @param html [String] HTML of a search-results page
# @return [Object] the value assigned to @totalhits
def parse(html)
  # Capture group 1 of the first summary-line match, or nil when absent.
  reported = html[/<\/b> of [\w\s]*<b>(.*)<\/b> from /, 1]
  @totalhits = reported.nil? ? 0 : totalhits(reported.delete(",").to_i)
end
#search ⇒ Object
9 10 11 12 13 14 15 |
# File 'lib/esearchy/SocialEngines/jigsaw.rb', line 9
#
# Builds the query path for a site-restricted search of www.jigsaw.com for
# @company, stores it in @querypath, then delegates to the inherited #search.
#
# @raise [ESearchyMissingCompany] when @company has not been set
# @return [Object] whatever the inherited #search returns
def search
  # The original `@querypath = "..." or raise ...` could never raise, because a
  # String is always truthy; a missing company blew up inside CGI.escape instead.
  # Check explicitly before building the path.
  raise ESearchyMissingCompany, "Missing website url Object.company=(value)" unless @company

  company = CGI.escape(@company)
  @querypath = "/cse?q=site:www.jigsaw.com/++%2B+#{company}+%2B" \
               "+intitle:\"#{company}\"" \
               "&hl=en&cof=&num=100&filter=0&safe=off&start="
  super
end