-
Notifications
You must be signed in to change notification settings - Fork 1.4k
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
[201803] [services] Restart SwSS service upon unexpected critical pro…
…cess exit (#2546) * [service] Restart SwSS Docker container if orchagent exits unexpectedly * [dhcp_relay] Use STATE_DB to determine whether interfaces are ready * Supervisor now autorestarts rsyslogd upon unexpected exit * Add other critical processes to event listener * Make supervisor-proc-exit-listener script global, have it read from 'critical_processes' file inside container * Add SwSS to 'WantedBy=' option of services which should be started along with SwSS
- Loading branch information
Showing
19 changed files
with
127 additions
and
60 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,42 +1,40 @@ | ||
#!/usr/bin/env bash | ||
|
||
function wait_until_iface_ready | ||
{ | ||
IFACE=$1 | ||
STATE_DB_IDX="6" | ||
|
||
echo "Waiting until interface $IFACE is up..." | ||
|
||
# Wait for the interface to come up (i.e., 'ip link show' returns 0) | ||
until ip link show dev $IFACE up > /dev/null 2>&1; do | ||
sleep 1 | ||
done | ||
PORT_TABLE_PREFIX="PORT_TABLE" | ||
VLAN_TABLE_PREFIX="VLAN_TABLE" | ||
LAG_TABLE_PREFIX="LAG_TABLE" | ||
|
||
echo "Interface $IFACE is up" | ||
function wait_until_iface_ready | ||
{ | ||
TABLE_PREFIX=$1 | ||
IFACE=$2 | ||
|
||
echo "Waiting until interface $IFACE has an IPv4 address..." | ||
echo "Waiting until interface $IFACE is ready..." | ||
|
||
# Wait until the interface gets assigned an IPv4 address | ||
# Wait for the interface to come up | ||
# (i.e., interface is present in STATE_DB and state is "ok") | ||
while true; do | ||
IP=$(ip -4 addr show dev $IFACE | grep "inet " | awk '{ print $2 }' | cut -d '/' -f1) | ||
|
||
if [ -n "$IP" ]; then | ||
RESULT=$(redis-cli -n ${STATE_DB_IDX} HGET "${TABLE_PREFIX}|${IFACE}" "state" 2> /dev/null) | ||
if [ x"$RESULT" == x"ok" ]; then | ||
break | ||
fi | ||
|
||
sleep 1 | ||
done | ||
|
||
echo "Interface $IFACE is configured with IP $IP" | ||
echo "Interface ${IFACE} is ready!" | ||
} | ||
|
||
|
||
# Wait for all interfaces to come up and have IPv4 addresses assigned | ||
# Wait for all interfaces to be up and ready | ||
{% for (name, prefix) in INTERFACE %} | ||
wait_until_iface_ready {{ name }} | ||
wait_until_iface_ready ${PORT_TABLE_PREFIX} {{ name }} | ||
{% endfor %} | ||
{% for (name, prefix) in VLAN_INTERFACE %} | ||
wait_until_iface_ready {{ name }} | ||
wait_until_iface_ready ${VLAN_TABLE_PREFIX} {{ name }} | ||
{% endfor %} | ||
{% for (name, prefix) in PORTCHANNEL_INTERFACE %} | ||
wait_until_iface_ready {{ name }} | ||
wait_until_iface_ready ${LAG_TABLE_PREFIX} {{ name }} | ||
{% endfor %} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,7 @@ | ||
orchagent | ||
portsyncd | ||
intfsyncd | ||
neighsyncd | ||
vlanmgrd | ||
intfmgrd | ||
buffermgrd |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,45 @@ | ||
#!/usr/bin/env python | ||
|
||
import os | ||
import signal | ||
import sys | ||
import syslog | ||
|
||
from supervisor import childutils | ||
|
||
# Contents of file should be the names of critical processes (as defined in | ||
# supervisor.conf file), one per line | ||
CRITICAL_PROCESSES_FILE = '/etc/supervisor/critical_processes' | ||
|
||
def main(): | ||
# Read the list of critical processes from a file | ||
with open(CRITICAL_PROCESSES_FILE, 'r') as f: | ||
critical_processes = [line.rstrip('\n') for line in f] | ||
|
||
while True: | ||
# Transition from ACKNOWLEDGED to READY | ||
childutils.listener.ready() | ||
|
||
line = sys.stdin.readline() | ||
headers = childutils.get_headers(line) | ||
payload = sys.stdin.read(int(headers['len'])) | ||
|
||
# Transition from READY to ACKNOWLEDGED | ||
childutils.listener.ok() | ||
|
||
# We only care about PROCESS_STATE_EXITED events | ||
if headers['eventname'] == 'PROCESS_STATE_EXITED': | ||
payload_headers, payload_data = childutils.eventdata(payload + '\n') | ||
|
||
expected = int(payload_headers['expected']) | ||
processname = payload_headers['processname'] | ||
|
||
# If a critical process exited unexpectedly, terminate supervisor | ||
if expected == 0 and processname in critical_processes: | ||
MSG_FORMAT_STR = "Process {} exited unxepectedly. Terminating supervisor..." | ||
msg = MSG_FORMAT_STR.format(payload_headers['processname']) | ||
syslog.syslog(syslog.LOG_INFO, msg) | ||
os.kill(os.getppid(), signal.SIGTERM) | ||
|
||
if __name__ == "__main__": | ||
main() |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
50 changes: 24 additions & 26 deletions
50
src/sonic-config-engine/tests/sample_output/wait_for_intf.sh
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,43 +1,41 @@ | ||
#!/usr/bin/env bash | ||
|
||
function wait_until_iface_ready | ||
{ | ||
IFACE=$1 | ||
STATE_DB_IDX="6" | ||
|
||
echo "Waiting until interface $IFACE is up..." | ||
|
||
# Wait for the interface to come up (i.e., 'ip link show' returns 0) | ||
until ip link show dev $IFACE up > /dev/null 2>&1; do | ||
sleep 1 | ||
done | ||
PORT_TABLE_PREFIX="PORT_TABLE" | ||
VLAN_TABLE_PREFIX="VLAN_TABLE" | ||
LAG_TABLE_PREFIX="LAG_TABLE" | ||
|
||
echo "Interface $IFACE is up" | ||
function wait_until_iface_ready | ||
{ | ||
TABLE_PREFIX=$1 | ||
IFACE=$2 | ||
|
||
echo "Waiting until interface $IFACE has an IPv4 address..." | ||
echo "Waiting until interface $IFACE is ready..." | ||
|
||
# Wait until the interface gets assigned an IPv4 address | ||
# Wait for the interface to come up | ||
# (i.e., interface is present in STATE_DB and state is "ok") | ||
while true; do | ||
IP=$(ip -4 addr show dev $IFACE | grep "inet " | awk '{ print $2 }' | cut -d '/' -f1) | ||
|
||
if [ -n "$IP" ]; then | ||
RESULT=$(redis-cli -n ${STATE_DB_IDX} HGET "${TABLE_PREFIX}|${IFACE}" "state" 2> /dev/null) | ||
if [ x"$RESULT" == x"ok" ]; then | ||
break | ||
fi | ||
|
||
sleep 1 | ||
done | ||
|
||
echo "Interface $IFACE is configured with IP $IP" | ||
echo "Interface ${IFACE} is ready!" | ||
} | ||
|
||
|
||
# Wait for all interfaces to come up and have IPv4 addresses assigned | ||
wait_until_iface_ready Vlan1000 | ||
wait_until_iface_ready PortChannel04 | ||
wait_until_iface_ready PortChannel02 | ||
wait_until_iface_ready PortChannel03 | ||
wait_until_iface_ready PortChannel03 | ||
wait_until_iface_ready PortChannel01 | ||
wait_until_iface_ready PortChannel02 | ||
wait_until_iface_ready PortChannel04 | ||
wait_until_iface_ready PortChannel01 | ||
# Wait for all interfaces to be up and ready | ||
wait_until_iface_ready ${VLAN_TABLE_PREFIX} Vlan1000 | ||
wait_until_iface_ready ${LAG_TABLE_PREFIX} PortChannel04 | ||
wait_until_iface_ready ${LAG_TABLE_PREFIX} PortChannel02 | ||
wait_until_iface_ready ${LAG_TABLE_PREFIX} PortChannel03 | ||
wait_until_iface_ready ${LAG_TABLE_PREFIX} PortChannel03 | ||
wait_until_iface_ready ${LAG_TABLE_PREFIX} PortChannel01 | ||
wait_until_iface_ready ${LAG_TABLE_PREFIX} PortChannel02 | ||
wait_until_iface_ready ${LAG_TABLE_PREFIX} PortChannel04 | ||
wait_until_iface_ready ${LAG_TABLE_PREFIX} PortChannel01 | ||
|