Restart IR and Storage on failures

Remove the useless container health checks and simply make the IR and Storage
nodes restart on failure. NeoFS daemons should do all they can to survive.

Signed-off-by: Stanislav Bogatyrev <stanislav@nspcc.ru>
This commit is contained in:
Stanislav Bogatyrev 2020-09-24 13:48:42 +03:00
parent 7d8fbc7754
commit a4cb92016f
4 changed files with 12 additions and 25 deletions

View file

@ -11,11 +11,6 @@ services:
chain_int: chain_int:
internet: internet:
ipv4_address: ${IPV4_PREFIX}.50 ipv4_address: ${IPV4_PREFIX}.50
healthcheck:
interval: 5s
retries: 15
test: ['CMD', 'sh', '-c', 'echo | nc 127.0.0.1 30333']
timeout: 10s
stop_signal: SIGKILL stop_signal: SIGKILL
environment: environment:
- ACC=/chain.gz - ACC=/chain.gz
@ -25,13 +20,6 @@ services:
- ./node-wallet.json:/wallets/node-wallet.json - ./node-wallet.json:/wallets/node-wallet.json
- ./../../vendor/hosts:/etc/hosts - ./../../vendor/hosts:/etc/hosts
neofs_main_chain-healthy:
image: alpine
container_name: neofs_main_chain-healthy
depends_on:
neofs_main_chain:
condition: service_healthy
networks: networks:
chain_int: chain_int:
internet: internet:

View file

@ -2,11 +2,13 @@
version: "2.4" version: "2.4"
services: services:
ir01: ir01:
image: ${IR_IMAGE}:${IR_VERSION} image: ${IR_IMAGE}:${IR_VERSION}
domainname: ${LOCAL_DOMAIN} domainname: ${LOCAL_DOMAIN}
hostname: ir01 hostname: ir01
container_name: ir01 container_name: ir01
restart: on-failure
networks: networks:
ir_int: ir_int:
internet: internet:
@ -24,6 +26,7 @@ services:
domainname: ${LOCAL_DOMAIN} domainname: ${LOCAL_DOMAIN}
hostname: ir02 hostname: ir02
container_name: ir02 container_name: ir02
restart: on-failure
networks: networks:
ir_int: ir_int:
internet: internet:
@ -41,6 +44,7 @@ services:
domainname: ${LOCAL_DOMAIN} domainname: ${LOCAL_DOMAIN}
hostname: ir03 hostname: ir03
container_name: ir03 container_name: ir03
restart: on-failure
networks: networks:
ir_int: ir_int:
internet: internet:
@ -58,6 +62,7 @@ services:
domainname: ${LOCAL_DOMAIN} domainname: ${LOCAL_DOMAIN}
hostname: ir04 hostname: ir04
container_name: ir04 container_name: ir04
restart: on-failure
networks: networks:
ir_int: ir_int:
internet: internet:
@ -75,6 +80,7 @@ services:
domainname: ${LOCAL_DOMAIN} domainname: ${LOCAL_DOMAIN}
hostname: ir05 hostname: ir05
container_name: ir05 container_name: ir05
restart: on-failure
networks: networks:
ir_int: ir_int:
internet: internet:
@ -92,6 +98,7 @@ services:
domainname: ${LOCAL_DOMAIN} domainname: ${LOCAL_DOMAIN}
hostname: ir06 hostname: ir06
container_name: ir06 container_name: ir06
restart: on-failure
networks: networks:
ir_int: ir_int:
internet: internet:
@ -109,6 +116,7 @@ services:
domainname: ${LOCAL_DOMAIN} domainname: ${LOCAL_DOMAIN}
hostname: ir07 hostname: ir07
container_name: ir07 container_name: ir07
restart: on-failure
networks: networks:
ir_int: ir_int:
internet: internet:

View file

@ -11,11 +11,6 @@ services:
chain_int: chain_int:
internet: internet:
ipv4_address: ${IPV4_PREFIX}.90 ipv4_address: ${IPV4_PREFIX}.90
healthcheck:
interval: 5s
retries: 15
test: ['CMD', 'sh', '-c', 'echo | nc 127.0.0.1 30333']
timeout: 10s
stop_signal: SIGKILL stop_signal: SIGKILL
environment: environment:
- ACC=/morph_chain.gz - ACC=/morph_chain.gz
@ -25,13 +20,6 @@ services:
- ./node-wallet.json:/wallets/node-wallet.json - ./node-wallet.json:/wallets/node-wallet.json
- ./../../vendor/hosts:/etc/hosts - ./../../vendor/hosts:/etc/hosts
neofs_morph_chain-healthy:
image: alpine
container_name: neofs_morph_chain-healthy
depends_on:
neofs_morph_chain:
condition: service_healthy
networks: networks:
chain_int: chain_int:
internet: internet:

View file

@ -7,6 +7,7 @@ services:
domainname: ${LOCAL_DOMAIN} domainname: ${LOCAL_DOMAIN}
hostname: s01 hostname: s01
container_name: s01 container_name: s01
restart: on-failure
networks: networks:
storage_int: storage_int:
internet: internet:
@ -26,7 +27,7 @@ services:
domainname: ${LOCAL_DOMAIN} domainname: ${LOCAL_DOMAIN}
hostname: s02 hostname: s02
container_name: s02 container_name: s02
container_name: s02 restart: on-failure
networks: networks:
storage_int: storage_int:
internet: internet:
@ -46,6 +47,7 @@ services:
domainname: ${LOCAL_DOMAIN} domainname: ${LOCAL_DOMAIN}
hostname: s03 hostname: s03
container_name: s03 container_name: s03
restart: on-failure
networks: networks:
storage_int: storage_int:
internet: internet:
@ -65,6 +67,7 @@ services:
domainname: ${LOCAL_DOMAIN} domainname: ${LOCAL_DOMAIN}
hostname: s04 hostname: s04
container_name: s04 container_name: s04
restart: on-failure
networks: networks:
storage_int: storage_int:
internet: internet: