# summary | refs | log | tree | commit | diff | homepage
# path: root/test/test_respawn.py
# blob: dc465cdaae2ca417894b92cda00c9d75134830fb (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
import re
import subprocess
import time

import pytest
from unit.applications.lang.python import ApplicationPython

# Module requirements: any version of the python module.
# NOTE(review): presumably read by the test harness to skip this file when
# the module is unavailable -- confirm against conftest.
prerequisites = {'modules': {'python': 'any'}}

# Shared application helper; the autouse fixture below assigns
# ``client.app_name`` and loads the application before each test.
client = ApplicationPython()

# Fragments interpolated into regular expressions that are matched against
# ``ps`` output lines to locate the router and controller processes.
PATTERN_ROUTER = 'unit: router'
PATTERN_CONTROLLER = 'unit: controller'


@pytest.fixture(autouse=True)
def setup_method_fixture(temp_dir):
    """Load the 'empty' application under a per-test name before each test.

    The application name is ``app-`` followed by the last ``/``-separated
    component of *temp_dir*; it is stored on the shared ``client`` so the
    helpers and tests in this module can refer to it.  After loading, the
    application's ``processes`` option is set to ``'1'`` and the request is
    asserted to succeed.
    """
    dir_name = temp_dir.rsplit("/", 1)[-1]
    client.app_name = f'app-{dir_name}'

    client.load('empty', client.app_name)

    response = client.conf('1', f'applications/{client.app_name}/processes')
    assert 'success' in response


def pid_by_name(name, ppid, ps_output=None):
    """Return the PID of the first process named *name* with parent *ppid*.

    The process table is taken from ``ps ax -O ppid``, whose lines start
    with the PID column followed by the PPID column.

    The match is anchored to the start of a line and requires whitespace on
    both sides of the PPID column.  Without that, the digits of *ppid* could
    be found inside a PID (``3412`` read as pid ``34`` + ppid ``12``) or as
    a prefix of a longer PPID (``12`` inside ``123``), returning an
    unrelated process.

    :param name: regular-expression fragment searched for after the PPID
        column on the same line (it is interpolated as-is, not escaped).
    :param ppid: parent process ID, as an ``int`` or ``str``.
    :param ps_output: optional, already captured ``ps ax -O ppid`` text;
        when omitted, ``ps`` is executed to obtain a fresh listing.
    :return: the PID as a string, or ``None`` if no line matches.
    """
    if ps_output is None:
        ps_output = subprocess.check_output(
            ['ps', 'ax', '-O', 'ppid']
        ).decode()

    m = re.search(
        fr'^[ \t]*(\d+)[ \t]+{ppid}[ \t].*{name}', ps_output, re.MULTILINE
    )
    return None if m is None else m.group(1)


def kill_pids(*pids):
    """Run ``kill -9`` with all of the given PIDs as arguments."""
    command = ['kill', '-9']
    command.extend(pids)
    subprocess.call(command)


def wait_for_process(process, unit_pid):
    """Poll until a process matching *process* with parent *unit_pid* exists.

    Makes up to 50 lookups via ``pid_by_name``, sleeping 0.1 s after every
    unsuccessful one.

    :return: the PID string of the process once found, otherwise ``None``.
    """
    for _ in range(50):
        pid = pid_by_name(process, unit_pid)

        if pid is not None:
            return pid

        time.sleep(0.1)

    return None


def find_proc(name, ppid, ps_output):
    """Return the ``ps`` lines of processes named *name* with parent *ppid*.

    *ps_output* is expected to be ``ps ax -O ppid`` text, i.e. each line
    starts with the PID column followed by the PPID column.  The match is
    anchored to that layout so the digits of *ppid* are only accepted as the
    whole PPID column -- not as part of a PID, a longer PPID or the TIME
    column, any of which would inflate the number of results.

    :param name: regular-expression fragment searched for after the PPID
        column on the same line (it is interpolated as-is, not escaped).
    :param ppid: parent process ID, as an ``int`` or ``str``.
    :param ps_output: captured output of ``ps ax -O ppid``.
    :return: list with one string per matching line, each spanning from the
        PPID column up to the end of the *name* match.
    """
    pattern = fr'^[ \t]*\d+[ \t]+({ppid}[ \t].*{name})'
    return [
        m.group(1) for m in re.finditer(pattern, ps_output, re.MULTILINE)
    ]


def smoke_test(unit_pid):
    """Check that the daemon is configurable, serving, and not duplicated.

    Sets the application's ``processes`` option to ``'1'`` (up to 10
    attempts, 0.1 s apart), asserts that the request succeeded and that a
    GET request returns status 200, then asserts that exactly one router,
    one controller and one application process are listed by ``ps`` as
    children of *unit_pid*.
    """
    processes_path = f'applications/{client.app_name}/processes'

    for _ in range(10):
        response = client.conf('1', processes_path)

        if 'success' in response:
            break

        time.sleep(0.1)

    assert 'success' in response
    assert client.get()['status'] == 200

    # Exactly one router, one controller and one application process
    # must be running under the main process.
    ps_listing = subprocess.check_output(['ps', 'ax', '-O', 'ppid']).decode()

    for pattern in (PATTERN_ROUTER, PATTERN_CONTROLLER, client.app_name):
        assert len(find_proc(pattern, unit_pid, ps_listing)) == 1


def test_respawn_router(skip_alert, unit_pid, skip_fds_check):
    """Kill the router process and expect a router process to be present
    under *unit_pid* again, with the daemon passing the smoke test."""
    skip_fds_check(router=True)

    router_pid = pid_by_name(PATTERN_ROUTER, unit_pid)
    kill_pids(router_pid)

    # NOTE(review): presumably registers the expected log alert so the
    # harness does not fail on it -- confirm against the fixture.
    skip_alert(fr'process {router_pid} exited on signal 9')

    respawned_pid = wait_for_process(PATTERN_ROUTER, unit_pid)
    assert respawned_pid is not None

    smoke_test(unit_pid)


def test_respawn_controller(skip_alert, unit_pid, skip_fds_check):
    """Kill the controller process and expect a controller process to be
    present under *unit_pid* again, with the daemon passing the smoke test."""
    skip_fds_check(controller=True)

    controller_pid = pid_by_name(PATTERN_CONTROLLER, unit_pid)
    kill_pids(controller_pid)

    # NOTE(review): presumably registers the expected log alert so the
    # harness does not fail on it -- confirm against the fixture.
    skip_alert(fr'process {controller_pid} exited on signal 9')

    respawned_pid = wait_for_process(PATTERN_CONTROLLER, unit_pid)
    assert respawned_pid is not None

    # Requests must be served before the configuration API is exercised
    # by the smoke test.
    response = client.get()
    assert response['status'] == 200

    smoke_test(unit_pid)


def test_respawn_application(skip_alert, unit_pid):
    """Kill the application process and expect an application process to be
    present under *unit_pid* again, with the daemon passing the smoke test."""
    app_pid = pid_by_name(client.app_name, unit_pid)
    kill_pids(app_pid)

    # NOTE(review): presumably registers the expected log alert so the
    # harness does not fail on it -- confirm against the fixture.
    skip_alert(fr'process {app_pid} exited on signal 9')

    respawned_pid = wait_for_process(client.app_name, unit_pid)
    assert respawned_pid is not None

    smoke_test(unit_pid)