Neels Hofmeyr | dae3d3c | 2017-03-28 12:16:58 +0200 | [diff] [blame] | 1 | # osmo_gsm_tester: process management |
| 2 | # |
| 3 | # Copyright (C) 2016-2017 by sysmocom - s.f.m.c. GmbH |
| 4 | # |
| 5 | # Author: Neels Hofmeyr <neels@hofmeyr.de> |
| 6 | # |
| 7 | # This program is free software: you can redistribute it and/or modify |
Harald Welte | 2720534 | 2017-06-03 09:51:45 +0200 | [diff] [blame] | 8 | # it under the terms of the GNU General Public License as |
Neels Hofmeyr | dae3d3c | 2017-03-28 12:16:58 +0200 | [diff] [blame] | 9 | # published by the Free Software Foundation, either version 3 of the |
| 10 | # License, or (at your option) any later version. |
| 11 | # |
| 12 | # This program is distributed in the hope that it will be useful, |
| 13 | # but WITHOUT ANY WARRANTY; without even the implied warranty of |
| 14 | # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
Harald Welte | 2720534 | 2017-06-03 09:51:45 +0200 | [diff] [blame] | 15 | # GNU General Public License for more details. |
Neels Hofmeyr | dae3d3c | 2017-03-28 12:16:58 +0200 | [diff] [blame] | 16 | # |
Harald Welte | 2720534 | 2017-06-03 09:51:45 +0200 | [diff] [blame] | 17 | # You should have received a copy of the GNU General Public License |
Neels Hofmeyr | dae3d3c | 2017-03-28 12:16:58 +0200 | [diff] [blame] | 18 | # along with this program. If not, see <http://www.gnu.org/licenses/>. |
| 19 | |
Neels Hofmeyr | 3531a19 | 2017-03-28 14:30:28 +0200 | [diff] [blame] | 20 | import os |
| 21 | import time |
| 22 | import subprocess |
| 23 | import signal |
Pau Espin Pedrol | 0d8deec | 2017-06-23 11:43:38 +0200 | [diff] [blame] | 24 | from datetime import datetime |
Neels Hofmeyr | 3531a19 | 2017-03-28 14:30:28 +0200 | [diff] [blame] | 25 | |
Pau Espin Pedrol | 9a4631c | 2018-03-28 19:17:34 +0200 | [diff] [blame] | 26 | from . import log |
| 27 | from .event_loop import MainLoop |
Neels Hofmeyr | 3531a19 | 2017-03-28 14:30:28 +0200 | [diff] [blame] | 28 | from .util import Dir |
| 29 | |
class Process(log.Origin):
    '''
    Launch and supervise one child process.

    The child's stdout and stderr are redirected into log files below
    run_dir. After the child has ended, self.result holds its exit status as
    reported by subprocess.Popen, and self.killed holds the last signal that
    terminate() sent, or None if terminate() sent none.
    '''

    def __init__(self, name, run_dir, popen_args, **popen_kwargs):
        '''
        name: used as the log origin name and later combined with the pid.
        run_dir: a Dir, or anything whose str() is a path; it becomes the
                 child's working directory and holds the output logs.
        popen_args: argument sequence handed to subprocess.Popen.
        popen_kwargs: additional keyword arguments for subprocess.Popen.
        '''
        super().__init__(log.C_RUN, name)
        self.process_obj = None
        self.result = None
        self.killed = None
        self.name_str = name
        self.run_dir = run_dir
        self.popen_args = popen_args
        self.popen_kwargs = popen_kwargs
        # maps output name ('stdout', 'stderr') to (path, open file or None)
        self.outputs = {}
        if not isinstance(self.run_dir, Dir):
            self.run_dir = Dir(os.path.abspath(str(self.run_dir)))

    def set_env(self, key, value):
        '''Set one environment variable in the 'env' dict passed to Popen.'''
        env = self.popen_kwargs.get('env') or {}
        env[key] = value
        self.popen_kwargs['env'] = env

    def make_output_log(self, name):
        '''
        create a non-existing log output file in run_dir to pipe stdout and
        stderr from this process to. Returns the file object opened for
        writing; it stays open until close_output_logs() is called.
        '''
        path = self.run_dir.new_child(name)
        f = open(path, 'w')
        # Register right away so that close_output_logs() can close the file
        # even if writing the header below fails.
        self.outputs[name] = (path, f)
        self.dbg(path)
        f.write('(launched: %s)\n' % datetime.now().strftime(log.LONG_DATEFMT))
        f.flush()
        return f

    def launch(self):
        '''
        Start the child process with stdout and stderr going to fresh log
        files in run_dir and stdin connected to a pipe.

        Any exception raised while opening the logs or by subprocess.Popen is
        re-raised after the already opened log files have been closed.
        '''
        # Same lookup as set_env(): tolerate a missing or None 'env'.
        env = self.popen_kwargs.get('env') or {}
        log.dbg('cd %r; %s %s' % (
            os.path.abspath(str(self.run_dir)),
            ' '.join(['%s=%r' % (k, v) for k, v in env.items()]),
            # str() so that a non-string argument cannot break the debug line
            ' '.join([str(arg) for arg in self.popen_args])))

        try:
            self.process_obj = subprocess.Popen(
                self.popen_args,
                stdout=self.make_output_log('stdout'),
                stderr=self.make_output_log('stderr'),
                stdin=subprocess.PIPE,
                shell=False,
                cwd=self.run_dir.path,
                **self.popen_kwargs)
        except Exception:
            # do not leak the log file handles opened just above
            self.close_output_logs()
            raise
        self.set_name(self.name_str, pid=self.process_obj.pid)
        self.log('Launched')

    def respawn(self):
        '''Launch the process again; it must not be running at this point.'''
        self.dbg('respawn')
        assert not self.is_running()
        self.result = None
        self.killed = None
        self.launch()

    def _poll_termination(self, time_to_wait_for_term=5):
        '''
        Poll the child until it has exited or roughly time_to_wait_for_term
        seconds have been accounted for.

        Stores the poll result in self.result. Returns True if the child has
        exited, False if it was still running when the wait budget ran out.
        '''
        wait_step = 0.001
        waited_time = 0
        while True:
            # poll returns None if proc is still running
            self.result = self.process_obj.poll()
            if self.result is not None:
                return True
            waited_time += wait_step
            # make wait_step approach 1.0
            wait_step = (1. + 5. * wait_step) / 6.
            if waited_time >= time_to_wait_for_term:
                break
            time.sleep(wait_step)
        return False

    def terminate(self):
        '''
        Stop the child, escalating from SIGINT over SIGTERM to SIGKILL, then
        reap it, record its exit status in self.result and run cleanup().

        Does nothing if the process was never launched or has already been
        seen to have ended.
        '''
        if self.process_obj is None:
            return
        if self.result is not None:
            return

        # first try SIGINT to allow stdout+stderr flushing
        self.log('Terminating (SIGINT)')
        os.kill(self.process_obj.pid, signal.SIGINT)
        self.killed = signal.SIGINT
        if not self._poll_termination():
            # SIGTERM maybe?
            self.log('Terminating (SIGTERM)')
            self.process_obj.terminate()
            self.killed = signal.SIGTERM
            if not self._poll_termination():
                # out of patience
                self.log('Terminating (SIGKILL)')
                self.process_obj.kill()
                self.killed = signal.SIGKILL

        # After SIGKILL nothing has polled the child yet, so the exit status
        # must be taken from wait(). Otherwise self.result would stay None
        # and a later poll() would run cleanup() a second time.
        self.result = self.process_obj.wait()
        self.cleanup()

    def cleanup(self):
        '''
        Close the output logs and log how the process ended; an ending that
        is neither exit status 0 nor caused by terminate() is logged as an
        error together with the tail of stderr.
        '''
        self.dbg('Cleanup')
        self.close_output_logs()
        if self.result == 0:
            self.log('Terminated: ok', rc=self.result)
        elif self.killed:
            self.log('Terminated', rc=self.result)
        else:
            self.err('Terminated: ERROR', rc=self.result)
            #self.log_stdout_tail()
            self.log_stderr_tail()

    def log_stdout_tail(self):
        '''Log the last lines of stdout, if there are any.'''
        m = self.get_stdout_tail(prefix='| ')
        if not m:
            return
        self.log('stdout:\n', m, '\n')

    def log_stderr_tail(self):
        '''Log the last lines of stderr, if there are any.'''
        m = self.get_stderr_tail(prefix='| ')
        if not m:
            return
        self.log('stderr:\n', m, '\n')

    def close_output_logs(self):
        '''Flush and close all open output logs, keeping their paths.'''
        # iterate over a snapshot since entries are replaced in the loop
        for k, v in list(self.outputs.items()):
            path, f = v
            if f:
                f.flush()
                f.close()
            self.outputs[k] = (path, None)

    def poll(self):
        '''
        Check once whether the child has ended; if so, store its exit status
        in self.result and run cleanup(). No-op if the process was never
        launched or its end has already been recorded.
        '''
        if self.process_obj is None:
            return
        if self.result is not None:
            return
        self.result = self.process_obj.poll()
        if self.result is not None:
            self.cleanup()

    def is_running(self, poll_first=True):
        '''Return True if the process was launched and has not ended yet.'''
        if poll_first:
            self.poll()
        return self.process_obj is not None and self.result is None

    def get_output(self, which):
        '''
        Return the complete text of the output log named which ('stdout' or
        'stderr'), or None if no such log has been created.
        '''
        v = self.outputs.get(which)
        if not v:
            return None
        path, _ = v
        with open(path, 'r') as f2:
            return f2.read()

    def get_output_tail(self, which, tail=10, prefix=''):
        '''
        Return the last tail lines of the output log named which, each line
        starting with prefix. Returns None if the log does not exist or is
        empty, and an empty string if tail is zero or negative.
        '''
        out = self.get_output(which)
        if not out:
            return None
        if tail <= 0:
            # out[-0:] would be the whole list, not an empty tail
            return ''
        out = out.splitlines()
        tail = min(len(out), tail)
        return prefix + ('\n' + prefix).join(out[-tail:])

    def get_stdout(self):
        '''Return the complete stdout log text, see get_output().'''
        return self.get_output('stdout')

    def get_stderr(self):
        '''Return the complete stderr log text, see get_output().'''
        return self.get_output('stderr')

    def get_stdout_tail(self, tail=10, prefix=''):
        '''Return the last lines of stdout, see get_output_tail().'''
        return self.get_output_tail('stdout', tail, prefix)

    def get_stderr_tail(self, tail=10, prefix=''):
        '''Return the last lines of stderr, see get_output_tail().'''
        return self.get_output_tail('stderr', tail, prefix)

    def terminated(self, poll_first=True):
        '''Return True once an exit status has been recorded.'''
        if poll_first:
            self.poll()
        return self.result is not None

    def wait(self, timeout=300):
        '''
        Hand self.terminated to MainLoop.wait() with the given timeout.
        NOTE(review): presumably this blocks until the process has ended or
        the timeout expires -- confirm against event_loop.MainLoop.
        '''
        MainLoop.wait(self, self.terminated, timeout=timeout)
Neels Hofmeyr | dae3d3c | 2017-03-28 12:16:58 +0200 | [diff] [blame] | 214 | |
| 215 | |
class RemoteProcess(Process):
    '''
    Process whose command line is executed on a remote host through ssh.

    The given popen_args are joined with spaces into a single command string
    (optionally preceded by a 'cd' into remote_cwd) and handed to a local
    'ssh user@host' invocation, so stdout and stderr travel over the ssh
    link into the local output logs.
    '''

    def __init__(self, name, run_dir, remote_user, remote_host, remote_cwd, popen_args, **popen_kwargs):
        super().__init__(name, run_dir, popen_args, **popen_kwargs)
        self.remote_user = remote_user
        self.remote_host = remote_host
        self.remote_cwd = remote_cwd

        # hacky: instead of just prepending ssh, i.e. piping stdout and stderr
        # over the ssh link, we should probably run on the remote side,
        # monitoring the process remotely.
        cd_prefix = 'cd "%s"; ' % self.remote_cwd if self.remote_cwd else ''
        ssh_target = self.remote_user + '@' + self.remote_host
        remote_command = cd_prefix + ' '.join(self.popen_args)
        self.popen_args = ['ssh', ssh_target, remote_command]
        self.dbg(self.popen_args, dir=self.run_dir, conf=self.popen_kwargs)
Neels Hofmeyr | dae3d3c | 2017-03-28 12:16:58 +0200 | [diff] [blame] | 235 | |
Pau Espin Pedrol | e4358a9 | 2018-10-01 11:27:55 +0200 | [diff] [blame] | 236 | |
def run_local_sync(run_dir, name, popen_args):
    '''
    Run popen_args as a local Process in a new sub directory of run_dir
    called name, wait for it to end, and raise log.Error if its result is
    not 0.
    '''
    proc = Process(name, run_dir.new_dir(name), popen_args)
    proc.launch()
    proc.wait()
    if proc.result == 0:
        return
    log.ctx(proc)
    raise log.Error('Exited in error')
| 245 | |
def run_remote_sync(run_dir, remote_user, remote_addr, name, popen_args, remote_cwd=None):
    '''
    Run popen_args as a RemoteProcess on remote_user@remote_addr, keeping
    the local logs in a new sub directory of run_dir called name. Waits for
    the process to end and raises log.Error if its result is not 0.
    '''
    proc = RemoteProcess(name, run_dir.new_dir(name), remote_user,
                         remote_addr, remote_cwd, popen_args)
    proc.launch()
    proc.wait()
    if proc.result == 0:
        return
    log.ctx(proc)
    raise log.Error('Exited in error')
| 255 | |
def scp(run_dir, remote_user, remote_addr, name, local_path, remote_path):
    '''
    Copy local_path recursively to remote_path on remote_user@remote_addr by
    running 'scp -r' synchronously via run_local_sync().
    '''
    destination = '%s@%s:%s' % (remote_user, remote_addr, remote_path)
    scp_command = ('scp', '-r', local_path, destination)
    run_local_sync(run_dir, name, scp_command)
| 258 | |
def copy_inst_ssh(run_dir, inst, remote_dir, remote_user, remote_addr, remote_rundir_append, cfg_file_name):
    '''
    Replace remote_dir on the remote host with a fresh copy of inst, create
    the run directory remote_rundir_append below it and copy cfg_file_name
    into remote_dir.

    Returns a Dir for the remote path the installation was copied to.
    '''
    def on_remote(step_name, command):
        # every remote step shares the same run_dir and ssh target
        run_remote_sync(run_dir, remote_user, remote_addr, step_name, command)

    inst_path = str(inst)
    remote_inst = Dir(remote_dir.child(os.path.basename(inst_path)))
    remote_path = str(remote_dir)

    # The '||' only works because RemoteProcess joins the arguments into one
    # command string that is passed to ssh.
    on_remote('rm-remote-dir',
              ('test', '!', '-d', remote_path, '||', 'rm', '-rf', remote_path))
    on_remote('mk-remote-dir', ('mkdir', '-p', remote_path))
    scp(run_dir, remote_user, remote_addr, 'scp-inst-to-remote', inst_path, remote_path)

    remote_run_dir = remote_dir.child(remote_rundir_append)
    on_remote('mk-remote-run-dir', ('mkdir', '-p', remote_run_dir))

    cfg_target = remote_dir.child(os.path.basename(cfg_file_name))
    scp(run_dir, remote_user, remote_addr, 'scp-cfg-to-remote', cfg_file_name, cfg_target)
    return remote_inst
| 272 | |
Neels Hofmeyr | dae3d3c | 2017-03-28 12:16:58 +0200 | [diff] [blame] | 273 | # vim: expandtab tabstop=4 shiftwidth=4 |