# kexec-tools/SOURCES/kdump-lib-initramfs.sh
#
# These variables and functions are useful in 2nd kernel

. /lib/kdump-lib.sh
. /lib/kdump-logger.sh

# Default settings. get_kdump_confs overrides KDUMP_PATH, CORE_COLLECTOR,
# SSH_KEY_LOCATION, KDUMP_PRE, KDUMP_POST, FAILURE_ACTION and FINAL_ACTION
# from the directives it finds in $KDUMP_CONF.
KDUMP_PATH="/var/crash"
KDUMP_LOG_FILE="/run/initramfs/kexec-dmesg.log"
# Left empty so get_kdump_confs can tell whether core_collector was configured
# and fall back to DEFAULT_CORE_COLLECTOR otherwise.
CORE_COLLECTOR=""
DEFAULT_CORE_COLLECTOR="makedumpfile -l --message-level 7 -d 31"
DMESG_COLLECTOR="/sbin/vmcore-dmesg"
FAILURE_ACTION="systemctl reboot -f"
# Evaluated once when this file is sourced; together with HOST_IP it names
# the per-dump directory ($HOST_IP-$DATEDIR) used by dump_fs.
DATEDIR=$(date +%Y-%m-%d-%T)
HOST_IP='127.0.0.1'
DUMP_INSTRUCTION=""
SSH_KEY_LOCATION="/root/.ssh/kdump_id_rsa"
KDUMP_SCRIPT_DIR="/kdumpscripts"
DD_BLKSIZE=512
FINAL_ACTION="systemctl reboot -f"
KDUMP_CONF="/etc/kdump.conf"
KDUMP_PRE=""
KDUMP_POST=""
NEWROOT="/sysroot"
# save_opalcore_fs falls back to /sys/firmware/opal/core when this path
# does not exist.
OPALCORE="/sys/firmware/opal/mpipl/core"

# Initiate the kdump logger; give up right away if that fails.
if ! dlog_init; then
    echo "failed to initiate the kdump logger."
    exit 1
fi

# Load the directives found in $KDUMP_CONF into the global settings.
#
# Globals read:    KDUMP_CONF, DEFAULT_CORE_COLLECTOR
# Globals written: KDUMP_PATH, CORE_COLLECTOR, SSH_KEY_LOCATION, KDUMP_PRE,
#                  KDUMP_POST, FENCE_KDUMP_ARGS, FENCE_KDUMP_NODES,
#                  FAILURE_ACTION, FINAL_ACTION
#
# Directives not listed below, and action values that are not recognised,
# are skipped and leave the previous value in place.
get_kdump_confs()
{
    local config_opt config_val

    # The first word of each line is the directive, the remainder its value.
    # -r keeps backslashes in the value as written.
    # NOTE(review): comments are presumably already removed by
    # read_strip_comments (defined outside this file) - confirm.
    while read -r config_opt config_val; do
        case "$config_opt" in
        path)
            KDUMP_PATH="$config_val"
            ;;
        core_collector)
            # An empty value keeps CORE_COLLECTOR unset so the default
            # is applied after the loop.
            if [ -n "$config_val" ]; then
                CORE_COLLECTOR="$config_val"
            fi
            ;;
        sshkey)
            # Only accept a key file that actually exists here.
            if [ -f "$config_val" ]; then
                SSH_KEY_LOCATION="$config_val"
            fi
            ;;
        kdump_pre)
            KDUMP_PRE="$config_val"
            ;;
        kdump_post)
            KDUMP_POST="$config_val"
            ;;
        fence_kdump_args)
            FENCE_KDUMP_ARGS="$config_val"
            ;;
        fence_kdump_nodes)
            FENCE_KDUMP_NODES="$config_val"
            ;;
        failure_action | default)
            # Both spellings select the failure action. The value is a
            # command string that do_failure_action later runs via eval.
            case "$config_val" in
            shell)
                FAILURE_ACTION="kdump_emergency_shell"
                ;;
            reboot)
                FAILURE_ACTION="systemctl reboot -f && exit"
                ;;
            halt)
                FAILURE_ACTION="halt && exit"
                ;;
            poweroff)
                FAILURE_ACTION="systemctl poweroff -f && exit"
                ;;
            dump_to_rootfs)
                FAILURE_ACTION="dump_to_rootfs"
                ;;
            esac
            ;;
        final_action)
            case "$config_val" in
            reboot)
                FINAL_ACTION="systemctl reboot -f"
                ;;
            halt)
                FINAL_ACTION="halt"
                ;;
            poweroff)
                FINAL_ACTION="systemctl poweroff -f"
                ;;
            esac
            ;;
        esac
    done <<< "$(read_strip_comments "$KDUMP_CONF")"

    # No core_collector configured: use the default, adding -F for ssh and
    # raw dump targets.
    if [ -z "$CORE_COLLECTOR" ]; then
        CORE_COLLECTOR="$DEFAULT_CORE_COLLECTOR"
        if is_ssh_dump_target || is_raw_dump_target; then
            CORE_COLLECTOR="$CORE_COLLECTOR -F"
        fi
    fi
}

# Store the kexec kernel log in $KDUMP_LOG_FILE.
#
# The file is rewritten from scratch with the output of "dmesg -T"; when
# journalctl is available its output ("journalctl -ab") is appended.
# Finally the file is made readable and writable by its owner only.
save_log()
{
    dmesg -T > "$KDUMP_LOG_FILE"
    if command -v journalctl > /dev/null; then
        journalctl -ab >> "$KDUMP_LOG_FILE"
    fi
    chmod 600 "$KDUMP_LOG_FILE"
}

# dump_fs <mount point>
#
# Save the crash dump below <mount point>/$KDUMP_PATH/$HOST_IP-$DATEDIR/:
# vmcore-dmesg and opalcore first, then the vmcore itself, and finally the
# kdump log file.
#
# Globals read:    KDUMP_PATH, HOST_IP, DATEDIR, DMESG_COLLECTOR,
#                  KDUMP_LOG_FILE
# Globals written: CORE_COLLECTOR (any -F is removed for makedumpfile)
# Returns: 0 when the vmcore was written and synced, 1 otherwise.
dump_fs()
{
    local _exitcode _sync_exitcode
    local _mp=$1
    local _dump_fs_path="$_mp/$KDUMP_PATH/$HOST_IP-$DATEDIR"

    ddebug "dump_fs _mp=$_mp"

    if ! is_mounted "$_mp"; then
        dinfo "dump path \"$_mp\" is not mounted, trying to mount..."
        if ! mount --target "$_mp"; then
            derror "failed to dump to \"$_mp\", it's not a mount point!"
            return 1
        fi
    fi

    # Remove -F in makedumpfile case. We don't want a flat format dump here.
    if [[ $CORE_COLLECTOR == *makedumpfile* ]]; then
        CORE_COLLECTOR=${CORE_COLLECTOR//-F/}
    fi

    dinfo "saving to $_dump_fs_path/"

    mount -o remount,rw "$_mp" || return 1
    mkdir -p "$_dump_fs_path" || return 1

    # The results of these two saves are not checked.
    save_vmcore_dmesg_fs "$DMESG_COLLECTOR" "$_dump_fs_path/"
    save_opalcore_fs "$_dump_fs_path/"

    dinfo "saving vmcore"
    # CORE_COLLECTOR holds a command plus its options, so it has to be
    # word-split here.
    # shellcheck disable=SC2086
    $CORE_COLLECTOR /proc/vmcore "$_dump_fs_path/vmcore-incomplete"
    _exitcode=$?
    if [ $_exitcode -eq 0 ]; then
        # Rename to the final name only after the data has been synced, so
        # a file called "vmcore" is always a complete one.
        sync -f "$_dump_fs_path/vmcore-incomplete"
        _sync_exitcode=$?
        if [ $_sync_exitcode -eq 0 ]; then
            mv "$_dump_fs_path/vmcore-incomplete" "$_dump_fs_path/vmcore"
            dinfo "saving vmcore complete"
        else
            derror "sync vmcore failed, _exitcode:$_sync_exitcode"
            # Note: this path returns before the log file is saved.
            return 1
        fi
    else
        derror "saving vmcore failed, _exitcode:$_exitcode"
    fi

    # The log is saved even when the core collector failed.
    dinfo "saving the $KDUMP_LOG_FILE to $_dump_fs_path/"
    save_log
    mv "$KDUMP_LOG_FILE" "$_dump_fs_path/"
    if [ $_exitcode -ne 0 ]; then
        return 1
    fi

    # Problems while saving or moving the log do not fail the dump.
    return 0
}
# save_vmcore_dmesg_fs <dmesg collector> <directory>
#
# Run <dmesg collector> on /proc/vmcore and store its output as
# <directory>/vmcore-dmesg.txt (owner read/write only). The output is
# written to vmcore-dmesg-incomplete.txt first and renamed only when the
# collector succeeds; on failure the incomplete file is left in place.
save_vmcore_dmesg_fs() {
    local _dmesg_collector=$1
    local _path=$2

    dinfo "saving vmcore-dmesg.txt to ${_path}"

    # The collector is deliberately left unquoted so that a value carrying
    # options is split into command and arguments.
    # shellcheck disable=SC2086
    if $_dmesg_collector /proc/vmcore > "${_path}/vmcore-dmesg-incomplete.txt"; then
        mv "${_path}/vmcore-dmesg-incomplete.txt" "${_path}/vmcore-dmesg.txt"
        chmod 600 "${_path}/vmcore-dmesg.txt"

        # Make sure file is on disk. There have been instances where later
        # saving vmcore failed and system rebooted without sync and there
        # was no vmcore-dmesg.txt available.
        sync
        dinfo "saving vmcore-dmesg.txt complete"
    else
        derror "saving vmcore-dmesg.txt failed"
    fi
}

# save_opalcore_fs <directory>
#
# Copy the file at $OPALCORE to <directory>/opalcore.
#
# Globals written: OPALCORE (switched to /sys/firmware/opal/core when the
#                  configured path is missing and that one exists)
# Returns: 0 when the copy succeeded or there is no opalcore file at all,
#          1 when the copy failed.
save_opalcore_fs() {
    local _path=$1

    if [ ! -f "$OPALCORE" ]; then
        # Check if we are on an old kernel that uses a different path
        if [ -f /sys/firmware/opal/core ]; then
            OPALCORE="/sys/firmware/opal/core"
        else
            return 0
        fi
    fi

    dinfo "saving opalcore:$OPALCORE to ${_path}/opalcore"
    if ! cp "$OPALCORE" "${_path}/opalcore"; then
        derror "saving opalcore failed"
        return 1
    fi

    sync
    dinfo "saving opalcore complete"
    return 0
}

# Start dracut-initqueue and sysroot.mount through systemctl, then dump
# into $NEWROOT with dump_fs. The result of the two systemctl calls is not
# checked; the return status is that of dump_fs.
dump_to_rootfs()
{
    dinfo "Trying to bring up rootfs device"
    systemctl start dracut-initqueue

    dinfo "Waiting for rootfs mount, will timeout after 90 seconds"
    systemctl start sysroot.mount

    ddebug "NEWROOT=$NEWROOT"
    dump_fs "$NEWROOT"
}
# Run the dracut emergency shell with a "kdump:" prompt.
#
# /etc/profile is overwritten with a PS1 assignment before
# /bin/dracut-emergency is started and deleted again once it returns.
kdump_emergency_shell()
{
    # The backslash is written to the file so that ${PWD} is not expanded
    # at the moment the profile is read.
    printf '%s\n' 'PS1="kdump:\${PWD}# "' > /etc/profile
    ddebug "Switching to dracut emergency..."
    /bin/dracut-emergency
    rm -f /etc/profile
}
# Log and run the command string stored in $FAILURE_ACTION.
#
# The string is run with eval because it can be a compound command such as
# "systemctl reboot -f && exit". It is quoted so that it is evaluated
# exactly as written, without prior word splitting or globbing.
# The return status is that of the evaluated command.
do_failure_action()
{
    dinfo "Executing failure action $FAILURE_ACTION"
    eval "$FAILURE_ACTION"
}
# Log and run the command string stored in $FINAL_ACTION.
#
# The string is quoted for eval so that it is evaluated exactly as written,
# without prior word splitting or globbing.
# The return status is that of the evaluated command.
do_final_action()
{
    dinfo "Executing final action $FINAL_ACTION"
    eval "$FINAL_ACTION"
}