[Services] Restart NAT service upon unexpected critical process exit. (#4208)
This commit is contained in:
parent
09c0563692
commit
64a6989d02
@ -38,6 +38,8 @@ RUN apt-get update \
|
|||||||
COPY ["start.sh", "/usr/bin/"]
|
COPY ["start.sh", "/usr/bin/"]
|
||||||
COPY ["supervisord.conf", "/etc/supervisor/conf.d/"]
|
COPY ["supervisord.conf", "/etc/supervisor/conf.d/"]
|
||||||
COPY ["restore_nat_entries.py", "/usr/bin/"]
|
COPY ["restore_nat_entries.py", "/usr/bin/"]
|
||||||
|
COPY ["files/supervisor-proc-exit-listener", "/usr/bin"]
|
||||||
|
COPY ["critical_processes", "/etc/supervisor"]
|
||||||
|
|
||||||
RUN apt-get clean -y; apt-get autoclean -y; apt-get autoremove -y
|
RUN apt-get clean -y; apt-get autoclean -y; apt-get autoremove -y
|
||||||
RUN rm -rf /debs
|
RUN rm -rf /debs
|
||||||
|
2
dockers/docker-nat/critical_processes
Normal file
2
dockers/docker-nat/critical_processes
Normal file
@ -0,0 +1,2 @@
|
|||||||
|
natmgrd
|
||||||
|
natsyncd
|
@ -3,6 +3,12 @@ logfile_maxbytes=1MB
|
|||||||
logfile_backups=2
|
logfile_backups=2
|
||||||
nodaemon=true
|
nodaemon=true
|
||||||
|
|
||||||
|
[eventlistener:supervisor-proc-exit-listener]
|
||||||
|
command=/usr/bin/supervisor-proc-exit-listener --container-name nat
|
||||||
|
events=PROCESS_STATE_EXITED
|
||||||
|
autostart=true
|
||||||
|
autorestart=unexpected
|
||||||
|
|
||||||
[program:start.sh]
|
[program:start.sh]
|
||||||
command=/usr/bin/start.sh
|
command=/usr/bin/start.sh
|
||||||
priority=1
|
priority=1
|
||||||
@ -15,7 +21,7 @@ stderr_logfile=syslog
|
|||||||
command=/usr/sbin/rsyslogd -n
|
command=/usr/sbin/rsyslogd -n
|
||||||
priority=2
|
priority=2
|
||||||
autostart=false
|
autostart=false
|
||||||
autorestart=false
|
autorestart=unexpected
|
||||||
stdout_logfile=syslog
|
stdout_logfile=syslog
|
||||||
stderr_logfile=syslog
|
stderr_logfile=syslog
|
||||||
|
|
||||||
|
@ -3,12 +3,16 @@ Description=NAT container
|
|||||||
Requires=updategraph.service swss.service
|
Requires=updategraph.service swss.service
|
||||||
After=updategraph.service swss.service syncd.service
|
After=updategraph.service swss.service syncd.service
|
||||||
Before=ntp-config.service
|
Before=ntp-config.service
|
||||||
|
StartLimitIntervalSec=1200
|
||||||
|
StartLimitBurst=3
|
||||||
|
|
||||||
[Service]
|
[Service]
|
||||||
User={{ sonicadmin_user }}
|
User={{ sonicadmin_user }}
|
||||||
ExecStartPre=/usr/bin/{{docker_container_name}}.sh start
|
ExecStartPre=/usr/bin/{{docker_container_name}}.sh start
|
||||||
ExecStart=/usr/bin/{{docker_container_name}}.sh wait
|
ExecStart=/usr/bin/{{docker_container_name}}.sh wait
|
||||||
ExecStop=/usr/bin/{{docker_container_name}}.sh stop
|
ExecStop=/usr/bin/{{docker_container_name}}.sh stop
|
||||||
|
Restart=always
|
||||||
|
RestartSec=30
|
||||||
|
|
||||||
[Install]
|
[Install]
|
||||||
WantedBy=multi-user.target swss.service
|
WantedBy=multi-user.target swss.service
|
||||||
|
@ -30,5 +30,6 @@ $(DOCKER_NAT)_RUN_OPT += --privileged -t
|
|||||||
$(DOCKER_NAT)_RUN_OPT += -v /etc/sonic:/etc/sonic:ro
|
$(DOCKER_NAT)_RUN_OPT += -v /etc/sonic:/etc/sonic:ro
|
||||||
$(DOCKER_NAT)_RUN_OPT += -v /host/warmboot:/var/warmboot
|
$(DOCKER_NAT)_RUN_OPT += -v /host/warmboot:/var/warmboot
|
||||||
|
|
||||||
$(DOCKER_NAT)_BASE_IMAGE_FILES += natctl:/usr/bin/natctl
|
$(DOCKER_NAT)_FILES += $(SUPERVISOR_PROC_EXIT_LISTENER_SCRIPT)
|
||||||
|
|
||||||
|
$(DOCKER_NAT)_BASE_IMAGE_FILES += natctl:/usr/bin/natctl
|
||||||
|
Reference in New Issue
Block a user