Class: OatsAgent::Ragent
- Inherits:
-
EventMachine::Connection
- Object
- EventMachine::Connection
- OatsAgent::Ragent
- Includes:
- EM::P::ObjectProtocol
- Defined in:
- lib/oats_agent/ragent.rb
Constant Summary collapse
- @@logger =
nil
- @@oats_info_snapshot =
{}
- @@job_count =
1
- @@occ_default =
nil
Instance Attribute Summary collapse
-
#jid ⇒ Object
Returns the value of attribute jid.
-
#job_count ⇒ Object
Returns the value of attribute job_count.
-
#occ_reintroduction_wait_time ⇒ Object
Returns the value of attribute occ_reintroduction_wait_time.
-
#request ⇒ Object
readonly
Returns the value of attribute request.
Class Method Summary collapse
-
.in_next_job ⇒ Object
Truthy (the object_id of the requesting agent) while a request for the next job is in progress; false otherwise.
- .in_next_job=(v) ⇒ Object
-
.is_busy ⇒ Object
Current/Last jobid worked on, or false.
- .is_busy=(jid) ⇒ Object
- .job_count ⇒ Object
-
.job_count=(val) ⇒ Object
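Sets the class-level job counter. (The source comment on this method is only a commented-out stub: def Ragent.force_close_connection ... end.)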
- .logger ⇒ Object
- .no_response(occv, ra, prev_jobid) ⇒ Object
-
.occ ⇒ Object
Contains YAML OCC entries if oats is started in agent mode.
- .server_logger(ra, arg) ⇒ Object
- .snapshot_oats_info(oats_info) ⇒ Object
- .start(occ_def) ⇒ Object
- .start_next_job(occ = @@occ_default, ra = nil, prev_jobid = nil) ⇒ Object
Instance Method Summary collapse
-
#get_oats_info ⇒ Object
Results_status: Early, Partial, Current, Archived, Missing, Error.
- #receive_object(request) ⇒ Object
-
#regen_results_summary!(oats_info) ⇒ Object
Generates summary data into the input oats_info.
- #run_next_job(prev_jobid = nil) ⇒ Object
- #server_logger(arg) ⇒ Object
- #unbind ⇒ Object
Instance Attribute Details
#jid ⇒ Object
Returns the value of attribute jid.
9 10 11 |
# File 'lib/oats_agent/ragent.rb', line 9
# Reader for the jid attribute; returns whatever is stored in @jid.
def jid
  @jid
end
#job_count ⇒ Object
Returns the value of attribute job_count.
9 10 11 |
# File 'lib/oats_agent/ragent.rb', line 9
# Reader for the job_count attribute; returns whatever is stored in @job_count.
def job_count
  @job_count
end
#occ_reintroduction_wait_time ⇒ Object
Returns the value of attribute occ_reintroduction_wait_time.
9 10 11 |
# File 'lib/oats_agent/ragent.rb', line 9
# Reader for the occ_reintroduction_wait_time attribute; returns whatever is
# stored in @occ_reintroduction_wait_time.
def occ_reintroduction_wait_time
  @occ_reintroduction_wait_time
end
#request ⇒ Object (readonly)
Returns the value of attribute request.
10 11 12 |
# File 'lib/oats_agent/ragent.rb', line 10
# Read-only accessor for the request attribute; returns whatever is stored in
# @request.
def request
  @request
end
Class Method Details
.in_next_job ⇒ Object
Truthy (the object_id of the requesting agent) while a request for the next job is in progress; false otherwise
19 20 21 |
# File 'lib/oats_agent/ragent.rb', line 19
# Class-level reader: returns the current value of @@in_next_job.
def Ragent.in_next_job
  @@in_next_job
end
.in_next_job=(v) ⇒ Object
22 23 24 |
# File 'lib/oats_agent/ragent.rb', line 22
# Class-level writer: stores v in @@in_next_job.
def Ragent.in_next_job=(v)
  @@in_next_job = v
end
.is_busy ⇒ Object
Current/Last jobid worked on, or false
29 30 31 |
# File 'lib/oats_agent/ragent.rb', line 29
# Class-level reader: returns the current value of @@is_busy
# (documented as the current/last job id worked on, or false).
def Ragent.is_busy
  @@is_busy
end
.is_busy=(jid) ⇒ Object
25 26 27 |
# File 'lib/oats_agent/ragent.rb', line 25
# Class-level writer: stores jid in @@is_busy.
def Ragent.is_busy=(jid)
  @@is_busy = jid
end
.job_count ⇒ Object
70 71 72 |
# File 'lib/oats_agent/ragent.rb', line 70
# Class-level reader: returns the current value of @@job_count.
def Ragent.job_count
  @@job_count
end
.job_count=(val) ⇒ Object
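Sets the class-level job counter (@@job_count).
(The source comment on this method is only a commented-out stub: def Ragent.force_close_connection ... end.)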
67 68 69 |
# File 'lib/oats_agent/ragent.rb', line 67
# Class-level writer: stores val in @@job_count.
def Ragent.job_count=(val)
  @@job_count = val
end
.logger ⇒ Object
37 38 39 |
# File 'lib/oats_agent/ragent.rb', line 37
# Returns the shared logger, creating a Log4r::Logger named 'A' the first time
# it is needed (i.e. while @@logger is still nil/false).
def Ragent.logger
  @@logger = Log4r::Logger.new('A') unless @@logger
  @@logger
end
.no_response(occv, ra, prev_jobid) ⇒ Object
286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 |
# File 'lib/oats_agent/ragent.rb', line 286
# Handles a failed or missing OCC response: clears the in_next_job flag,
# schedules a retry of Ragent.start_next_job, and enlarges the stored wait
# time used by the following retry.
#
# occv       - OCC settings, passed through to Ragent.start_next_job
# ra         - Ragent instance whose wait time is used/updated; when nil the
#              class-level @@occ_reintroduction_wait_time is used instead
# prev_jobid - previous job id, passed through to Ragent.start_next_job
def self.no_response(occv, ra, prev_jobid)
  Ragent.in_next_job = false
  Ragent.server_logger ra, "OCC did not respond."
  delay =
    if ra
      ra.occ_reintroduction_wait_time
    else
      @@occ_reintroduction_wait_time
    end
  # No wait time recorded yet: start from the configured timeout
  delay ||= $oats['execution']['occ']['timeout_waiting_for_occ']
  self.server_logger ra, "Will retry in #{delay} seconds."
  EM.add_timer(delay) do
    Ragent.start_next_job(occv, ra, prev_jobid) unless Ragent.is_busy # by now
  end
  # Keep retrying to introduce; each interval grows by a random factor
  # between 1.5 and 2.5
  next_delay = (delay * (1.5 + rand(101) / 100.0)).round
  if ra
    ra.occ_reintroduction_wait_time = next_delay
  else
    @@occ_reintroduction_wait_time = next_delay
  end
end
.occ ⇒ Object
Contains YAML OCC entries if oats is started in agent mode
34 35 36 |
# File 'lib/oats_agent/ragent.rb', line 34
# Class-level reader: returns @@occ_default (documented as the YAML OCC
# entries when oats is started in agent mode).
def Ragent.occ
  @@occ_default
end
.server_logger(ra, arg) ⇒ Object
309 310 311 312 313 314 315 316 317 318 319 |
# File 'lib/oats_agent/ragent.rb', line 309
# Writes an info line of the form "[RS<tag>] <arg>" to the shared logger.
#
# ra  - Ragent instance or nil. When given, the tag is ":R<id>" where <id> is
#       the request's :id if present, otherwise ra.object_id, followed by
#       " J:<jid>" when ra.jid is set. When nil, the tag is empty.
# arg - message to log
#
# Any StandardError raised while building or writing the line is logged as an
# error (inspect + backtrace) instead of propagating.
def Ragent.server_logger(ra, arg)
  if ra
    req = ra.request
    jid = ra.jid
    rt = ":R#{(req and req[:id]) ? req[:id] : ra.object_id}"
    rt += " J:#{jid}" if jid
  end
  # Go through Ragent.logger rather than @@logger: @@logger starts out nil and
  # is only created lazily by Ragent.logger.
  Ragent.logger.info "[RS#{rt}] #{arg}"
rescue
  Ragent.logger.error $!.inspect + "\n" + $!.backtrace.join("\n ")
end
.snapshot_oats_info(oats_info) ⇒ Object
74 75 76 |
# File 'lib/oats_agent/ragent.rb', line 74
# Stores oats_info as the class-level snapshot (@@oats_info_snapshot), which
# get_oats_info reads when reporting on the job in progress.
def Ragent.snapshot_oats_info(oats_info)
  @@oats_info_snapshot = oats_info
end
.start(occ_def) ⇒ Object
41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 |
# File 'lib/oats_agent/ragent.rb', line 41
# Starts the agent: records the OCC defaults, resets the class-level state,
# runs the EventMachine reactor with a server bound to agent_host/agent_port,
# and on the first reactor tick asks for the next job.
#
# occ_def - hash of OCC settings; 'agent_host' and 'agent_port' are read here
#
# The reactor is started up to 3 times: if it exits with an exception the
# exception is logged and the loop starts over; a normal return from
# EventMachine::run (shutdown requested) ends the loop.
def Ragent.start(occ_def)
  @@occ_default = occ_def # This should not change during agent execution
  3.times do |count| # In case of unexpected exceptions
    begin
      @@occ_reintroduction_wait_time = nil
      @@is_busy = false # If agent is started from scratch assume previous one is gone
      @@in_next_job = false
      Ragent.logger.info "====================================================================================="
      # HOSTNAME is not always exported to the environment; to_s keeps a
      # missing value from aborting start-up just to build a log line.
      mach_port = ENV['HOSTNAME'].to_s + ':' + $oats['execution']['occ']['port'].to_s
      Ragent.logger.info "Started OATS Server execution-#{count} on #{mach_port} at #{Time.now} "
      EventMachine::run do
        EventMachine::start_server @@occ_default['agent_host'], @@occ_default['agent_port'].to_i, Ragent
        EventMachine.next_tick do
          Ragent.server_logger nil,'Initiating contact with OCC '
          Ragent.start_next_job unless Ragent.is_busy
        end
      end
      break # Shutdown requested
    # NOTE(review): rescuing Exception also traps SystemExit/Interrupt and
    # restarts the reactor; kept as-is because it looks deliberate - confirm.
    rescue Exception => exc
      Ragent.logger.error exc
    end
  end
end
.start_next_job(occ = @@occ_default, ra = nil, prev_jobid = nil) ⇒ Object
200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 |
# File 'lib/oats_agent/ragent.rb', line 200
# Asks the OCC for the next job (GET /jobs/nxt) and, when one is returned,
# runs it via Oats::Driver.start on an EventMachine.defer thread, then asks
# for the following job.
#
# occ        - hash of OCC settings; reads 'agent_nickname', 'agent_host',
#              'agent_port', 'server_host' and 'server_port'
# ra         - Ragent instance on whose behalf the request is made, or nil
# prev_jobid - id of the job just finished, sent to the OCC as 'jobid'
#
# Returns false without contacting the OCC when a request is already in
# progress (Ragent.in_next_job) or a job is running (Ragent.is_busy).
# A non-200 status or a connection error is handed to no_response, which
# schedules a retry.
def self.start_next_job(occ = @@occ_default, ra = nil, prev_jobid = nil)
  if Ragent.in_next_job or Ragent.is_busy
    msg = if Ragent.in_next_job
      if Ragent.in_next_job == nil.object_id
        "already getting the initial job."
      else
        "already getting job for #{Ragent.in_next_job}]"
      end
    else
      "became busy with #{Ragent.is_busy}"
    end
    Ragent.server_logger ra, "Not requesting new job since #{msg}"
    return false
  end
  # ra may be nil here; nil.object_id is then used as the marker
  Ragent.in_next_job = ra.object_id
  # Double check that this agent has the busy lock
  if not Ragent.in_next_job or Ragent.in_next_job != ra.object_id
    Ragent.server_logger(ra, "Not requesting new job since " +
        "now another Ragent #{ra.object_id} is requesting next job besides current #{Ragent.in_next_job}")
    return false
  end
  query = {
    'nickname' => occ['agent_nickname'],
    'machine' => occ['agent_host'],
    'port' => occ['agent_port']
  }
  query['jobid'] = prev_jobid if prev_jobid
  query['repo'] = ENV['OATS_TESTS_CODE_VERSION'].to_s if ENV['OATS_TESTS_CODE_VERSION'] and ENV['OATS_TESTS_CODE_VERSION'] != ''
  query['logfile'] = File.basename(ENV['OATS_AGENT_LOGFILE']||'agent.log')
  # Log the query before the password is added to it
  Ragent.server_logger ra, "Getting next OCC job: " + query.inspect
  # NOTE(review): the key really is 'password=' (with the trailing '=') -
  # confirm this is what the OCC expects before changing it.
  query['password='] = ra.request[:password] if ra and ra.request[:password]
  # Default inactivity_timeout of 10 is not enough when OCC is restarting too
  # many agents. Agent gives up in 10secs but OCC hands over the job in 20secs.
  # As a result OCC thinks job is received but agent has never seen the job.
  options = { :connect_timeout => 60, :inactivity_timeout => 60 }
  http_req = EventMachine::HttpRequest.new('http://' + occ['server_host'] + ":#{occ['server_port']}", options)
  http = http_req.get :path => '/jobs/nxt', :query => query
  http.errback { self.no_response(occ, ra, prev_jobid) }
  http.callback do
    status = http.response_header.status
    if status == 200
      data = http.response
      nxt_job = JSON.parse(data) if data
      # nxt_job is nil when there was no body or the body was JSON null;
      # treat that like "no job" instead of raising inside the callback and
      # leaving in_next_job set forever.
      if nxt_job && nxt_job['jid']
        Ragent.is_busy = nxt_job['jid']
        Ragent.in_next_job = false
        if ra
          ra.jid = nxt_job['jid']
          ra.occ_reintroduction_wait_time = nil # Reset wait time to default if heard from OCC
        end
        Ragent.server_logger ra, "Job-#{Ragent.job_count} #{nxt_job.inspect}"
        EventMachine.defer do
          begin
            opts = { 'execution:environments' => [nxt_job['env']],
              'execution:test_files' => [nxt_job['list']] }
            opts['_:options'] = nxt_job['options'].split(',') if nxt_job['options'] and nxt_job['options'] != ''
            Ragent.snapshot_oats_info({})
            Oats::Driver.start(nxt_job['jid'], opts)
          ensure
            Ragent.is_busy = false
          end
          Ragent.job_count += 1
          if ra
            ra.run_next_job(nxt_job['jid'])
          else
            Ragent.start_next_job(occ, ra, nxt_job['jid'])
          end
        end
      else
        Ragent.in_next_job = false
        Ragent.server_logger ra, "No more pending jobs at OCC. Pausing processing.\n"
        Ragent.job_count = 1
        Ragent.server_logger ra, "***********************************************************\n"
      end
    else
      self.no_response(occ, ra, prev_jobid)
    end
  end
rescue RuntimeError => e
  Ragent.in_next_job = false
  if e.message == 'eventmachine not initialized: evma_connect_to_server'
    Ragent.server_logger ra, "Shutting down..."
  else
    Ragent.server_logger ra, $!.inspect + "\n" + $!.backtrace.join("\n ")
  end
end
Instance Method Details
#get_oats_info ⇒ Object
Results_status: Early, Partial, Current, Archived, Missing, Error
87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 |
# File 'lib/oats_agent/ragent.rb', line 87
# Builds the oats_info hash answering a 'results' request for @request[:jobid].
# The hash carries a 'results_status' of Early, Partial, Current, Archived,
# Missing or Error, chosen as follows:
#   Partial  - the job is running and the snapshot summary could be regenerated
#   Error    - the job is running but the summary failed, or the snapshot
#              belongs to a different job id
#   Early    - the job is running but no snapshot job id is stored yet
#   Archived - results.dump was found under the archive dir for this job id
#   Current  - results.dump in the current results dir matches this job id
#   Missing  - no matching/readable results.dump was found
# If anything raises, the error is logged and the logger call's result is
# returned instead of a hash.
def get_oats_info
  if @request[:jobid] == Ragent.is_busy # working on it now
    if @request[:jobid] == @@oats_info_snapshot['jobid'] # first test started processing
      if regen_results_summary!(@@oats_info_snapshot) # summary succeeded
        # Marshal round-trip produces a deep copy of the shared snapshot
        oats_info = Marshal.load(Marshal.dump(@@oats_info_snapshot))
        oats_info['results_status'] = 'Partial'
      else
        server_logger "[ERROR] Can not regen_results_summary from the snapshot"
        oats_info = {'results_status' => 'Error'}
      end
    elsif @@oats_info_snapshot['jobid']
      msg = "ERROR: Unexpected condition. Request jobid: #{@request[:jobid]} does not match stored job id: #{@@oats_info_snapshot['jobid']}"
      server_logger msg
      oats_info = { 'jobid' => @request[:jobid], 'results_status' => 'Error', 'error_message' => msg }
    else
      # Snapshot has no job id yet: report a deep copy of the Oats context
      oats_info = Marshal.load(Marshal.dump(Oats.context))
      oats_info['results_status'] = 'Early'
      oats_info['jobid'] = Ragent.is_busy
    end
  else # Search for request on disk in archive or results
    res_dir = File.join(Oats.result_archive_dir, @request[:jobid].to_s)
    results_file = File.join( res_dir,'results.dump')
    if File.readable?(results_file) # Archived ones should have summary
      oats_info = Oats::Report.oats_info_retrieve(results_file)
      oats_info['results_status'] = 'Archived'
    else # May have to regenerate the summary, in case test had died
      results_file = File.join( $oats['execution']['dir_results'], 'results.dump')
      if File.readable?(results_file)
        oats_info = Oats::Report.oats_info_retrieve(results_file)
        if regen_results_summary!(oats_info) and @request[:jobid] == oats_info['jobid']
          oats_info['results_status'] = 'Current'
        else
          # Whatever was retrieved may not be a Hash; start from an empty one
          oats_info = {} unless oats_info.instance_of?(Hash)
          oats_info['debug_message'] = "request_jobid: #{@request[:jobid]}, current oats_info jobid: #{oats_info['jobid']}"
          oats_info['results_status'] = 'Missing'
        end
      else
        oats_info = { 'results_status' => 'Missing' , 'debug_message' => "No readable: #{results_file}" }
      end
    end
  end
  # Convert object to hash
  oats_info['test_files'] = oats_info['test_files'].testlist_hash if oats_info['test_files']
  return oats_info
rescue
  server_logger $!.inspect + "\n" + $!.backtrace.join("\n ")
end
#receive_object(request) ⇒ Object
136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 |
# File 'lib/oats_agent/ragent.rb', line 136 def receive_object(request) @request = request password = @request.delete(:password) server_logger "Received " + @request.inspect @request[:password] = password response = {} case @request[:command] when 'status' EventMachine.next_tick { run_next_job } unless Ragent.is_busy when 'start' if Ragent.is_busy server_logger "Not getting next job again because Ragent.is_busy: #{Ragent.is_busy}" else EventMachine.next_tick { run_next_job } end when 'results' begin response[:oats_info] = get_oats_info rescue server_logger $!.inspect + "\n" + $!.backtrace.join("\n ") end when 'run' # only called from oats client, not from OCC EventMachine.defer( proc { Oats::Driver.start(@request[:jobid], @request[:args]) } ) unless Ragent.is_busy when 'stop' # any further test execution for this jobid Oats.context['stop_oats'] = @request[:id] if @request[:stop_jobs].include?(Oats.context['jobid']) when 'shutdown' else response[:unknown_command] = true server_logger "Unknown command #{@request[:command]}" end response[:is_busy] = Ragent.is_busy stop_oats = Oats.context && Oats.context['stop_oats'] response[:is_signal_oats_to_stop] = stop_oats if stop_oats server_logger "Sending " + response.inspect response[:password] = password send_object(response) close_connection_after_writing rescue server_logger $!.inspect + "\n" + $!.backtrace.join("\n ") end |
#regen_results_summary!(oats_info) ⇒ Object
Generates summary data into the input oats_info
79 80 81 82 83 84 |
# File 'lib/oats_agent/ragent.rb', line 79
# Regenerates the results summary for oats_info by handing its 'test_files'
# entry to Oats::Report.results (second argument true).
#
# Returns whatever Oats::Report.results returns; if anything raises, the error
# is logged through server_logger and false is returned.
def regen_results_summary!(oats_info)
  test_files = oats_info['test_files']
  Oats::Report.results(test_files, true)
rescue
  server_logger $!.inspect + "\n" + $!.backtrace.join("\n ")
  false
end
#run_next_job(prev_jobid = nil) ⇒ Object
192 193 194 195 196 197 198 |
# File 'lib/oats_agent/ragent.rb', line 192
# Requests the next job from the OCC named in the current request.
#
# prev_jobid - id of the job just finished, passed to Ragent.start_next_job
#
# Returns nil without doing anything when the request has no :occ_host;
# otherwise returns the result of Ragent.start_next_job.
def run_next_job(prev_jobid = nil)
  occ_host = @request[:occ_host]
  return unless occ_host # Bad input or invoked via client, not occ
  # Work on a copy so the class-level defaults are left untouched
  occ = @@occ_default.clone
  occ['server_host'] = occ_host
  occ['server_port'] = @request[:occ_port]
  Ragent.start_next_job(occ, self, prev_jobid)
end
#server_logger(arg) ⇒ Object
305 306 307 |
# File 'lib/oats_agent/ragent.rb', line 305
# Instance-level convenience: forwards arg to Ragent.server_logger with this
# object as the first argument.
def server_logger(arg)
  Ragent.server_logger(self, arg)
end
#unbind ⇒ Object
185 186 187 188 189 190 |
# File 'lib/oats_agent/ragent.rb', line 185
# Connection-closed hook. When the request handled on this connection was the
# 'shutdown' command, logs the shutdown and stops the EventMachine event loop.
#
# @request is only assigned in receive_object, so it is still nil when a
# connection closes before any object arrived; that case is ignored rather
# than raising NoMethodError on nil.
def unbind
  return unless @request && @request[:command] == 'shutdown'
  server_logger "Shutting down the server."
  EventMachine::stop_event_loop
end