309278389e
This change implements the reccomended rolling restart procedure[0] for elasticsearch-data pods. [0] https://www.elastic.co/guide/en/elasticsearch/reference/7.x/restart-cluster.html#restart-cluster-rolling Change-Id: I935b3681999e9bda616898f2b5e01f582ee54ed9
128 lines
4.8 KiB
Smarty
128 lines
4.8 KiB
Smarty
#!/bin/bash
|
|
{{/*
|
|
Licensed under the Apache License, Version 2.0 (the "License");
|
|
you may not use this file except in compliance with the License.
|
|
You may obtain a copy of the License at
|
|
|
|
http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
Unless required by applicable law or agreed to in writing, software
|
|
distributed under the License is distributed on an "AS IS" BASIS,
|
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
See the License for the specific language governing permissions and
|
|
limitations under the License.
|
|
*/}}
|
|
|
|
{{- $envAll := . }}
|
|
|
|
set -e
|
|
COMMAND="${@:-start}"
|
|
|
|
function initiate_keystore () {
|
|
bin/elasticsearch-keystore create
|
|
echo ${S3_ACCESS_KEY} | /usr/share/elasticsearch/bin/elasticsearch-keystore add -xf s3.client.default.access_key
|
|
echo ${S3_SECRET_KEY} | /usr/share/elasticsearch/bin/elasticsearch-keystore add -xf s3.client.default.secret_key
|
|
}
|
|
|
|
function start () {
|
|
ulimit -l unlimited
|
|
initiate_keystore
|
|
exec /usr/local/bin/docker-entrypoint.sh elasticsearch
|
|
}
|
|
|
|
function stop () {
|
|
kill -TERM 1
|
|
}
|
|
|
|
function wait_to_join() {
|
|
joined=$(curl -s -K- <<< "--user ${ELASTICSEARCH_USERNAME}:${ELASTICSEARCH_PASSWORD}" "${ELASTICSEARCH_ENDPOINT}/_cat/nodes" | grep -w $NODE_NAME || true )
|
|
|
|
while [ -z "$joined" ]; do
|
|
sleep 5
|
|
joined=$(curl -s -K- <<< "--user ${ELASTICSEARCH_USERNAME}:${ELASTICSEARCH_PASSWORD}" "${ELASTICSEARCH_ENDPOINT}/_cat/nodes" | grep -w $NODE_NAME || true )
|
|
done
|
|
}
|
|
|
|
function allocate_data_node () {
|
|
if [ -f /data/restarting ]; then
|
|
rm /data/restarting
|
|
echo "Node ${NODE_NAME} has restarted. Waiting to rejoin the cluster."
|
|
wait_to_join
|
|
|
|
echo "Re-enabling Replica Shard Allocation"
|
|
curl -s -K- <<< "--user ${ELASTICSEARCH_USERNAME}:${ELASTICSEARCH_PASSWORD}" -XPUT -H 'Content-Type: application/json' \
|
|
"${ELASTICSEARCH_ENDPOINT}/_cluster/settings" -d "{
|
|
\"persistent\": {
|
|
\"cluster.routing.allocation.enable\": null
|
|
}
|
|
}"
|
|
fi
|
|
}
|
|
|
|
function start_master_node () {
|
|
ulimit -l unlimited
|
|
initiate_keystore
|
|
if [ ! -f {{ $envAll.Values.conf.elasticsearch.config.path.data }}/cluster-bootstrap.txt ];
|
|
then
|
|
{{ if empty $envAll.Values.conf.elasticsearch.config.cluster.initial_master_nodes -}}
|
|
{{- $_ := set $envAll.Values "__eligible_masters" ( list ) }}
|
|
{{- range $podInt := until ( atoi (print $envAll.Values.pod.replicas.master ) ) }}
|
|
{{- $eligibleMaster := printf "elasticsearch-master-%s" (toString $podInt) }}
|
|
{{- $__eligible_masters := append $envAll.Values.__eligible_masters $eligibleMaster }}
|
|
{{- $_ := set $envAll.Values "__eligible_masters" $__eligible_masters }}
|
|
{{- end -}}
|
|
{{- $masters := include "helm-toolkit.utils.joinListWithComma" $envAll.Values.__eligible_masters -}}
|
|
echo {{$masters}} >> {{ $envAll.Values.conf.elasticsearch.config.path.data }}/cluster-bootstrap.txt
|
|
exec /usr/local/bin/docker-entrypoint.sh elasticsearch -Ecluster.initial_master_nodes={{$masters}}
|
|
{{- end }}
|
|
else
|
|
exec /usr/local/bin/docker-entrypoint.sh elasticsearch
|
|
fi
|
|
}
|
|
|
|
function start_data_node () {
|
|
ulimit -l unlimited
|
|
initiate_keystore
|
|
allocate_data_node &
|
|
/usr/local/bin/docker-entrypoint.sh elasticsearch &
|
|
function drain_data_node () {
|
|
|
|
# Implement the Rolling Restart Protocol Described Here:
|
|
# https://www.elastic.co/guide/en/elasticsearch/reference/7.x/restart-cluster.html#restart-cluster-rolling
|
|
|
|
echo "Disabling Replica Shard Allocation"
|
|
curl -s -K- <<< "--user ${ELASTICSEARCH_USERNAME}:${ELASTICSEARCH_PASSWORD}" -XPUT -H 'Content-Type: application/json' \
|
|
"${ELASTICSEARCH_ENDPOINT}/_cluster/settings" -d "{
|
|
\"persistent\": {
|
|
\"cluster.routing.allocation.enable\": \"primaries\"
|
|
}
|
|
}"
|
|
|
|
# If version < 7.6 use _flush/synced; otherwise use _flush
|
|
# https://www.elastic.co/guide/en/elasticsearch/reference/current/indices-synced-flush-api.html#indices-synced-flush-api
|
|
|
|
version=$(curl -s -K- <<< "--user ${ELASTICSEARCH_USERNAME}:${ELASTICSEARCH_PASSWORD}" "${ELASTICSEARCH_ENDPOINT}/" | jq -r .version.number)
|
|
|
|
if [[ $version =~ "7.1" ]]; then
|
|
action="_flush/synced"
|
|
else
|
|
action="_flush"
|
|
fi
|
|
|
|
curl -s -K- <<< "--user ${ELASTICSEARCH_USERNAME}:${ELASTICSEARCH_PASSWORD}" -XPOST "${ELASTICSEARCH_ENDPOINT}/$action"
|
|
|
|
# TODO: Check the response of synced flush operations to make sure there are no failures.
|
|
# Synced flush operations that fail due to pending indexing operations are listed in the response body,
|
|
# although the request itself still returns a 200 OK status. If there are failures, reissue the request.
|
|
# (The only side effect of not doing so is slower start up times. See flush documentation linked above)
|
|
|
|
touch /data/restarting
|
|
echo "Node ${NODE_NAME} is ready to shutdown"
|
|
kill -TERM 1
|
|
}
|
|
trap drain_data_node TERM EXIT HUP INT
|
|
wait
|
|
}
|
|
|
|
$COMMAND
|