Class: MultiprocessQueueClient

Inherits:
GHTorrent::Command show all
Includes:
GHTorrent::Logging, GHTorrent::Settings
Defined in:
lib/ghtorrent/multiprocess_queue_client.rb

Direct Known Subclasses

GHTRetrieveRepos

Constant Summary

Constants included from GHTorrent::Logging

GHTorrent::Logging::DEBUG_LEVEL

Constants included from GHTorrent::Settings

GHTorrent::Settings::CONFIGKEYS, GHTorrent::Settings::DEFAULTS

Instance Method Summary collapse

Methods included from GHTorrent::Logging

#debug, #info, #warn

Methods included from GHTorrent::Settings

#config, #merge, #merge_config_values, #override_config, #settings

Methods included from GHTorrent::Utils

included, #read_value, #user_type, #write_value

Methods inherited from GHTorrent::Command

#command_name, #override_config, #process_options, #queue_client, run, #version

Instance Method Details

#clazz ⇒ Object



6
7
8
# File 'lib/ghtorrent/multiprocess_queue_client.rb', line 6

# Hook that supplies the worker class; this base version has no
# implementation and always fails.
#
# @raise [RuntimeError] always, with the message 'Unimplemented'
def clazz
  raise RuntimeError, 'Unimplemented'
end

#go ⇒ Object



46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
# File 'lib/ghtorrent/multiprocess_queue_client.rb', line 46

# Forks one worker process per entry described in the mapping file and blocks
# until every worker has exited.
#
# The mapping file path is taken from ARGV[0]. Every line is split on
# whitespace and is expected to look like one of:
#
#   U IP UNAME PASSWD NUM_PROCS
#   T IP TOKEN NUM_PROCS
#
# Lines starting with '#', blank lines, and lines whose first field is neither
# 'U' nor 'T' are skipped. For each accepted line, NUM_PROCS configurations
# are derived from a clone of the current settings with the IP and
# credentials overridden.
#
# Each child builds `clazz.new(config, options[:queue])`, installs a TERM
# handler that calls `stop` on it, runs it and exits. If Interrupt is raised
# while the parent is waiting, the wait is abandoned.
def go
  # File.readlines closes the file before returning; the previous
  # File.open(...).readlines left the handle open until garbage collection.
  configs = File.readlines(ARGV[0]).flat_map do |line|
    next [] if line =~ /^#/

    # Split once, on any run of whitespace, so tabs or repeated spaces
    # between fields cannot shift the columns.
    type, *fields = line.split
    case type
    when 'U'
      ip, name, passwd, instances = fields
    when 'T'
      ip, token, instances = fields
    else
      next []
    end

    # A missing or non-numeric NUM_PROCS converts to 0 and yields no configs.
    (1..instances.to_i).map do
      newcfg = override_config(settings.clone, :attach_ip, ip)

      if type == 'U'
        newcfg = override_config(newcfg, :github_username, name)
        newcfg = override_config(newcfg, :github_passwd, passwd)
      else
        newcfg = override_config(newcfg, :github_token, token)
      end

      # NOTE(review): presumably large enough to mean "walk the full
      # history" -- confirm against the retriever.
      override_config(newcfg, :mirror_history_pages_back, 100000)
    end
  end

  children = configs.map do |config|
    pid = Process.fork

    if pid.nil?
      # Child process: run a single retriever, then terminate.
      retriever = clazz.new(config, options[:queue])

      Signal.trap('TERM') { retriever.stop }

      retriever.run(self)
      exit
    else
      debug "Parent #{Process.pid} forked child #{pid}"
      pid
    end
  end

  debug 'Waiting for children'
  begin
    children.each do |pid|
      debug "Waiting for child #{pid}"
      Process.waitpid(pid, 0)
      debug "Child #{pid} exited"
    end
  rescue Interrupt
    debug 'Stopping'
  end
end

#logger ⇒ Object



36
37
38
39
# File 'lib/ghtorrent/multiprocess_queue_client.rb', line 36

# Returns the memoized logger, creating one that writes to STDOUT on first
# use.
def logger
  return @logger if @logger

  @logger = Logger.new(STDOUT)
end

#prepare_options(options) ⇒ Object



10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
# File 'lib/ghtorrent/multiprocess_queue_client.rb', line 10

# Registers this command's usage banner and its :queue option on the given
# option parser.
#
# @param options the parser object; it receives one `banner` call followed by
#   one `opt` call
# @return whatever the parser's `opt` call returns
def prepare_options(options)
  usage = <<-BANNER
Retrieve data for multiple repos in parallel. To work, it requires
a mapping file formatted as either of the follow formats:

U IP UNAME PASSWD NUM_PROCS
T IP TOKEN NUM_PROCS

{U,T}: U signifies that a username/password pair is provided, T that an OAuth
     token is specified instead
IP: address to use for outgoing requests (use 0.0.0.0 on non-multihomed hosts)
UNAME: Github user name to use for outgoing requests
PASSWD: Github password to use for outgoing requests
TOKEN: Github OAuth token
NUM_PROCS: Number of processes to spawn for this IP/UNAME combination

Values in the config.yaml file set with the -c command are overridden.

#{command_name} [options] mapping-file

  BANNER

  options.banner(usage)

  # -q/--queue defaults to 'multiprocess-queue-client'.
  options.opt(:queue, 'Queue to retrieve project names from',
              :short => 'q',
              :default => 'multiprocess-queue-client',
              :type => :string)
end

#validate ⇒ Object



41
42
43
44
# File 'lib/ghtorrent/multiprocess_queue_client.rb', line 41

# Runs the inherited validation, then reports an error through Trollop::die
# when no mapping-file argument (args[0]) was supplied.
def validate
  super
  Trollop::die 'Argument mapping-file is required' if args[0].nil?
end