885285139e
There are many race conditions possible when multiple ceph-osd pods are initialized on the same host at the same time using shared metadata disks. The locked() function was introduced a while back to address these, but some commands weren't locked, locked() was being called all over the place, and there was a file descriptor leak in locked(). This change cleans that up by by maintaining a single, global file descriptor for the lock file that is only opened and closed once, and also by aliasing all of the commands that need to use locked() and removing explicit calls to locked() everywhere. The global_locked() function has also been removed as it isn't needed when individual commands that interact with disks use locked() properly. Change-Id: I0018cf0b3a25bced44c57c40e33043579c42de7a
156 lines
4.2 KiB
Smarty
156 lines
4.2 KiB
Smarty
#!/bin/bash
|
|
|
|
{{/*
|
|
Licensed under the Apache License, Version 2.0 (the "License");
|
|
you may not use this file except in compliance with the License.
|
|
You may obtain a copy of the License at
|
|
|
|
http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
Unless required by applicable law or agreed to in writing, software
|
|
distributed under the License is distributed on an "AS IS" BASIS,
|
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
See the License for the specific language governing permissions and
|
|
limitations under the License.
|
|
*/}}
|
|
|
|
source /tmp/osd-common-ceph-volume.sh
|
|
|
|
set -ex
|
|
|
|
: "${OSD_SOFT_FORCE_ZAP:=1}"
|
|
: "${OSD_JOURNAL_DISK:=}"
|
|
|
|
if [ "x${STORAGE_TYPE%-*}" == "xdirectory" ]; then
|
|
export OSD_DEVICE="/var/lib/ceph/osd"
|
|
else
|
|
export OSD_DEVICE=$(readlink -f ${STORAGE_LOCATION})
|
|
fi
|
|
|
|
if [ "x$JOURNAL_TYPE" == "xdirectory" ]; then
|
|
export OSD_JOURNAL="/var/lib/ceph/journal"
|
|
else
|
|
export OSD_JOURNAL=$(readlink -f ${JOURNAL_LOCATION})
|
|
fi
|
|
|
|
if [[ -z "${OSD_DEVICE}" ]];then
|
|
echo "ERROR- You must provide a device to build your OSD ie: /dev/sdb"
|
|
exit 1
|
|
fi
|
|
|
|
if [[ ! -b "${OSD_DEVICE}" ]]; then
|
|
echo "ERROR- The device pointed by OSD_DEVICE ${OSD_DEVICE} doesn't exist !"
|
|
exit 1
|
|
fi
|
|
|
|
CEPH_DISK_OPTIONS=""
|
|
CEPH_OSD_OPTIONS=""
|
|
|
|
udev_settle
|
|
|
|
OSD_ID=$(ceph-volume inventory ${OSD_DEVICE} | grep "osd id" | awk '{print $3}')
|
|
simple_activate=0
|
|
if [[ -z ${OSD_ID} ]]; then
|
|
echo "Looks like ceph-disk has been used earlier to activate the OSD."
|
|
tmpmnt=$(mktemp -d)
|
|
mount ${OSD_DEVICE}1 ${tmpmnt}
|
|
OSD_ID=$(cat ${tmpmnt}/whoami)
|
|
umount ${tmpmnt}
|
|
simple_activate=1
|
|
fi
|
|
OSD_FSID=$(ceph-volume inventory ${OSD_DEVICE} | grep "osd fsid" | awk '{print $3}')
|
|
if [[ -z ${OSD_FSID} ]]; then
|
|
echo "Looks like ceph-disk has been used earlier to activate the OSD."
|
|
tmpmnt=$(mktemp -d)
|
|
mount ${OSD_DEVICE}1 ${tmpmnt}
|
|
OSD_FSID=$(cat ${tmpmnt}/fsid)
|
|
umount ${tmpmnt}
|
|
simple_activate=1
|
|
fi
|
|
OSD_PATH="${OSD_PATH_BASE}-${OSD_ID}"
|
|
OSD_KEYRING="${OSD_PATH}/keyring"
|
|
|
|
mkdir -p ${OSD_PATH}
|
|
|
|
if [[ ${simple_activate} -eq 1 ]]; then
|
|
ceph-volume simple activate --no-systemd ${OSD_ID} ${OSD_FSID}
|
|
else
|
|
ceph-volume lvm -v \
|
|
--setuser ceph \
|
|
--setgroup disk \
|
|
activate ${CEPH_DISK_OPTIONS} \
|
|
--auto-detect-objectstore \
|
|
--no-systemd ${OSD_ID} ${OSD_FSID}
|
|
fi
|
|
|
|
# NOTE(stevetaylor): Set the OSD's crush weight (use noin flag to prevent rebalancing if necessary)
|
|
OSD_WEIGHT=$(get_osd_crush_weight_from_device ${OSD_DEVICE})
|
|
# NOTE(supamatt): add or move the OSD's CRUSH location
|
|
crush_location
|
|
|
|
if [ "${OSD_BLUESTORE:-0}" -ne 1 ]; then
|
|
if [ -n "${OSD_JOURNAL}" ]; then
|
|
if [ -b "${OSD_JOURNAL}" ]; then
|
|
OSD_JOURNAL_DISK="$(readlink -f ${OSD_PATH}/journal)"
|
|
if [ -z "${OSD_JOURNAL_DISK}" ]; then
|
|
echo "ERROR: Unable to find journal device ${OSD_JOURNAL_DISK}"
|
|
exit 1
|
|
else
|
|
OSD_JOURNAL="${OSD_JOURNAL_DISK}"
|
|
if [ -e "${OSD_PATH}/run_mkjournal" ]; then
|
|
ceph-osd -i ${OSD_ID} --mkjournal
|
|
rm -rf ${OSD_PATH}/run_mkjournal
|
|
fi
|
|
fi
|
|
fi
|
|
if [ "x${JOURNAL_TYPE}" == "xdirectory" ]; then
|
|
OSD_JOURNAL="${OSD_JOURNAL}/journal.${OSD_ID}"
|
|
touch ${OSD_JOURNAL}
|
|
wait_for_file "${OSD_JOURNAL}"
|
|
else
|
|
if [ ! -b "${OSD_JOURNAL}" ]; then
|
|
echo "ERROR: Unable to find journal device ${OSD_JOURNAL}"
|
|
exit 1
|
|
else
|
|
chown ceph. "${OSD_JOURNAL}"
|
|
fi
|
|
fi
|
|
else
|
|
wait_for_file "${OSD_JOURNAL}"
|
|
chown ceph. "${OSD_JOURNAL}"
|
|
fi
|
|
fi
|
|
|
|
# NOTE(supamatt): Just in case permissions do not align up, we recursively set them correctly.
|
|
if [ $(stat -c%U ${OSD_PATH}) != ceph ]; then
|
|
chown -R ceph. ${OSD_PATH};
|
|
fi
|
|
|
|
# NOTE(gagehugo): Writing the OSD_ID to tmp for logging
|
|
echo "${OSD_ID}" > /tmp/osd-id
|
|
|
|
if [ "x${JOURNAL_TYPE}" == "xdirectory" ]; then
|
|
chown -R ceph. /var/lib/ceph/journal
|
|
ceph-osd \
|
|
--cluster ceph \
|
|
--osd-data ${OSD_PATH} \
|
|
--osd-journal ${OSD_JOURNAL} \
|
|
-f \
|
|
-i ${OSD_ID} \
|
|
--setuser ceph \
|
|
--setgroup disk \
|
|
--mkjournal
|
|
fi
|
|
|
|
exec /usr/bin/ceph-osd \
|
|
--cluster ${CLUSTER} \
|
|
${CEPH_OSD_OPTIONS} \
|
|
-f \
|
|
-i ${OSD_ID} \
|
|
--setuser ceph \
|
|
--setgroup disk & echo $! > /run/ceph-osd.pid
|
|
wait
|
|
|
|
# Clean up resources held by the common script
|
|
common_cleanup
|