diff options
Diffstat (limited to 'sys/contrib/openzfs/scripts/zloop.sh')
-rwxr-xr-x | sys/contrib/openzfs/scripts/zloop.sh | 304 |
1 files changed, 304 insertions, 0 deletions
#!/usr/bin/env bash

#
# CDDL HEADER START
#
# This file and its contents are supplied under the terms of the
# Common Development and Distribution License ("CDDL"), version 1.0.
# You may only use this file in accordance with the terms of version
# 1.0 of the CDDL.
#
# A full copy of the text of the CDDL should have accompanied this
# source. A copy of the CDDL is also available via the Internet at
# http://www.illumos.org/license/CDDL.
#
# CDDL HEADER END
#

#
# Copyright (c) 2015 by Delphix. All rights reserved.
# Copyright (C) 2016 Lawrence Livermore National Security, LLC.
#

# Pull in the shared helper script that lives next to this one; the
# ZTEST and ZDB variables used below are not set anywhere in this file,
# so they are presumably provided by it.
BASE_DIR=$(dirname "$0")
SCRIPT_COMMON=common.sh
if [ -f "${BASE_DIR}/${SCRIPT_COMMON}" ]; then
	. "${BASE_DIR}/${SCRIPT_COMMON}"
else
	echo "Missing helper script ${SCRIPT_COMMON}" && exit 1
fi

# shellcheck disable=SC2034
PROG=zloop.sh
GDB=${GDB:-gdb}

DEFAULTWORKDIR=/var/tmp
DEFAULTCOREDIR=/var/tmp/zloop

#
# Print the help text to stderr.  The synopsis lists every option that
# the getopts loop below accepts.
#
function usage
{
	cat >&2 <<EOF

$0 [-t <timeout>] [-s <vdev size>] [-f <working directory>]
    [-c <dump directory>] [-m <max cores>] [-l] [-h]
    [ -- [extra ztest parameters]]

  This script runs ztest repeatedly with randomized arguments.
  If a crash is encountered, the ztest logs, any associated
  vdev files, and core file (if one exists) are moved to the
  output directory ($DEFAULTCOREDIR by default). Any options
  after the -- end-of-options marker will be passed to ztest.

  Options:
    -t  Total time to loop for, in seconds. If not provided,
        zloop runs forever.
    -s  Size of vdev devices.
    -f  Specify working directory for ztest vdev files.
    -c  Specify a core dump directory to use.
    -m  Max number of core dumps to allow before exiting.
    -l  Create 'ztest.core.N' symlink to core directory.
    -h  Print this help message.

EOF
}

#
# Run the command given as arguments; if it fails, report it and exit
# the script with status 1.
#
# The arguments are executed exactly as passed ("$@"): they are not
# word-split or glob-expanded a second time, so paths containing
# whitespace survive.  Callers that need a glob must expand it
# themselves at the call site.
#
function or_die
{
	if ! "$@"; then
		echo "Command failed: $*"
		exit 1
	fi
}

#
# Write the core pattern that was saved at startup back to the kernel.
# Installed as an EXIT trap once the pattern has been modified.
#
function restore_core_pattern
{
	echo "$origcorepattern" > /proc/sys/kernel/core_pattern
}

# Work out which file names a core dump will have on this platform.
case $(uname) in
FreeBSD)
	coreglob="z*.core"
	;;
Linux)
	# core file helpers
	origcorepattern="$(cat /proc/sys/kernel/core_pattern)"
	# Keep only the leading part of the pattern that contains no pipe,
	# no % specifier and no whitespace, and turn it into a glob.
	coreglob="$(grep -E -o '^([^|%[:space:]]*)' /proc/sys/kernel/core_pattern)*"

	if [[ $coreglob = "*" ]]; then
		# Nothing usable was left of the configured pattern, so
		# switch to plain "core" files.  This is a system-wide
		# setting: make sure it is put back whenever the script
		# exits, e.g. when or_die aborts or the core limit is hit.
		echo "Setting core file pattern..."
		trap restore_core_pattern EXIT
		echo "core" > /proc/sys/kernel/core_pattern
		coreglob="$(grep -E -o '^([^|%[:space:]]*)' \
		    /proc/sys/kernel/core_pattern)*"
	fi
	;;
*)
	echo "Unsupported platform: $(uname)" >&2
	exit 1
	;;
esac

#
# Print the name of one core file matching $coreglob in the current
# directory (the first entry of `ls -tr1`), or nothing when no file
# matches.
#
function core_file
{
	# $coreglob is intentionally unquoted so that the glob expands.
	# shellcheck disable=SC2012 disable=2086
	printf "%s" "$(ls -tr1 $coreglob 2> /dev/null | head -1)"
}

#
# Print the program that should be handed to gdb for the core file $1:
# $ZDB when gdb reports that the core was generated by "zdb ",
# otherwise $ZTEST.
#
function core_prog
{
	local prog core_id

	prog=$ZTEST
	core_id=$($GDB --batch -c "$1" | grep "Core was generated by" | \
	    tr \' ' ')
	# shellcheck disable=SC2076
	if [[ "$core_id" =~ "zdb " ]]; then
		prog=$ZDB
	fi
	printf "%s" "$prog"
}

#
# If the last ztest run failed ($ztrc non-zero) or left a core file
# behind, collect the evidence: zdb output, the ztest logs, the vdev
# files and pool cache from $workdir and, when present, the core file
# together with gdb backtraces.  Everything is moved into a new
# time-stamped directory under $coredir.
#
# Increments the global crash counter $foundcrashes and exits the
# script once $coremax (when greater than zero) has been reached.
#
function store_core
{
	local core coreid dest zdbdebug coreprog coredebug
	local -a zdbcmd

	core="$(core_file)"
	if [[ $ztrc -ne 0 ]] || [[ -f "$core" ]]; then
		df -h "$workdir" >>ztest.out
		coreid=$(date "+zloop-%y%m%d-%H%M%S")
		foundcrashes=$((foundcrashes + 1))

		# zdb debugging
		# $ZDB stays unquoted so it is split as it always was; the
		# cache path is passed as a single word.
		# shellcheck disable=SC2206
		zdbcmd=($ZDB -U "$workdir/zpool.cache" -dddMmDDG ztest)
		zdbdebug=$("${zdbcmd[@]}" 2>&1)
		echo -e "${zdbcmd[*]}\n" >>ztest.zdb
		echo "$zdbdebug" >>ztest.zdb

		dest=$coredir/$coreid
		or_die mkdir -p "$dest"
		or_die mkdir -p "$dest/vdev"

		if [[ $symlink -ne 0 ]]; then
			or_die ln -sf "$dest" "ztest.core.$foundcrashes"
		fi

		echo "*** ztest crash found - moving logs to $dest"

		or_die mv ztest.history "$dest/"
		or_die mv ztest.zdb "$dest/"
		or_die mv ztest.out "$dest/"
		# The glob is expanded here, outside the quotes, because
		# or_die passes its arguments through untouched.
		or_die mv "$workdir/"ztest* "$dest/vdev/"

		if [[ -e "$workdir/zpool.cache" ]]; then
			or_die mv "$workdir/zpool.cache" "$dest/vdev/"
		fi

		# check for core
		if [[ -f "$core" ]]; then
			coreprog=$(core_prog "$core")
			coredebug=$($GDB --batch --quiet \
			    -ex "set print thread-events off" \
			    -ex "printf \"*\n* Backtrace \n*\n\"" \
			    -ex "bt" \
			    -ex "printf \"*\n* Libraries \n*\n\"" \
			    -ex "info sharedlib" \
			    -ex "printf \"*\n* Threads (full) \n*\n\"" \
			    -ex "info threads" \
			    -ex "printf \"*\n* Backtraces \n*\n\"" \
			    -ex "thread apply all bt" \
			    -ex "printf \"*\n* Backtraces (full) \n*\n\"" \
			    -ex "thread apply all bt full" \
			    -ex "quit" "$coreprog" "$core" 2>&1 | \
			    grep -v "New LWP")

			# Dump core + logs to stored directory
			echo "$coredebug" >>"$dest/ztest.gdb"
			or_die mv "$core" "$dest/"

			# Record info in cores logfile
			echo "*** core @ $coredir/$coreid/$core:" | \
			    tee -a ztest.cores
		fi

		if [[ $coremax -gt 0 ]] &&
		    [[ $foundcrashes -ge $coremax ]]; then
			echo "exiting... max $coremax allowed cores"
			exit 1
		else
			echo "continuing..."
		fi
	fi
}

# parse arguments
# expected format: zloop [-t timeout] [-c coredir] [-- extra ztest args]
coredir=$DEFAULTCOREDIR
basedir=$DEFAULTWORKDIR
rundir="zloop-run"
timeout=0
size="512m"
coremax=0
symlink=0
# The leading ':' puts getopts in silent mode: an option that is missing
# its argument is reported as ':' and an unknown option as '?', both
# with the offending letter in $OPTARG.
while getopts ":ht:m:s:c:f:l" opt; do
	case $opt in
		t ) [[ $OPTARG -gt 0 ]] && timeout=$OPTARG ;;
		m ) [[ $OPTARG -gt 0 ]] && coremax=$OPTARG ;;
		s ) [[ $OPTARG ]] && size=$OPTARG ;;
		c ) [[ $OPTARG ]] && coredir=$OPTARG ;;
		f ) [[ $OPTARG ]] && basedir=$(readlink -f "$OPTARG") ;;
		l ) symlink=1 ;;
		h ) usage
		    exit 2
		    ;;
		: ) echo "Option -$OPTARG requires an argument";
		    usage
		    exit 1
		    ;;
		* ) echo "Invalid argument: -$OPTARG";
		    usage
		    exit 1
		    ;;
	esac
done
# pass remaining arguments on to ztest
shift $((OPTIND - 1))

# enable core dumps
ulimit -c unlimited
export ASAN_OPTIONS=abort_on_error=1:disable_coredump=0

# Refuse to start when a matching core file is already present in the
# current directory; store_core would otherwise treat it as a new crash.
if [[ -f "$(core_file)" ]]; then
	echo -n "There's a core dump here you might want to look at first... "
	core_file
	echo
	exit 1
fi

if [[ ! -d $coredir ]]; then
	echo "core dump directory ($coredir) does not exist, creating it."
	or_die mkdir -p "$coredir"
fi

if [[ ! -w $coredir ]]; then
	echo "core dump directory ($coredir) is not writable."
	exit 1
fi

# Start from clean log files in the current directory.
or_die rm -f ztest.history
or_die rm -f ztest.zdb
or_die rm -f ztest.cores

ztrc=0		# ztest return value
foundcrashes=0	# number of crashes found so far
starttime=$(date +%s)
curtime=$starttime

# if no timeout was specified, loop forever.
# Main loop: every iteration runs ztest once in a fresh working
# directory with a newly chosen pool layout, then lets store_core
# collect the evidence if the run failed or dumped core.
while [[ $timeout -eq 0 ]] || [[ $curtime -le $((starttime + timeout)) ]]; do
	# start each run with an empty directory
	workdir="$basedir/$rundir"
	or_die rm -rf "$workdir"
	or_die mkdir "$workdir"

	# switch between common arrangements & fully randomized
	if [[ $((RANDOM % 2)) -eq 0 ]]; then
		mirrors=2
		raidz=0
		parity=1
		vdevs=2
	else
		mirrors=$(((RANDOM % 3) * 1))
		parity=$(((RANDOM % 3) + 1))
		# either 0 or a value in [parity + 1, parity + 9]
		raidz=$((((RANDOM % 9) + parity + 1) * (RANDOM % 2)))
		vdevs=$(((RANDOM % 3) + 3))
	fi
	align=$(((RANDOM % 2) * 3 + 9))
	runtime=$((RANDOM % 100))
	passtime=$((RANDOM % (runtime / 3 + 1) + 10))

	# Collect the ztest options as an array so that every value
	# (notably the working directory) stays a single argument.
	zopt=(-G -VVVVV)
	zopt+=(-m "$mirrors")
	zopt+=(-r "$raidz")
	zopt+=(-R "$parity")
	zopt+=(-v "$vdevs")
	zopt+=(-a "$align")
	zopt+=(-T "$runtime")
	zopt+=(-P "$passtime")
	zopt+=(-s "$size")
	zopt+=(-f "$workdir")

	# $ZTEST is deliberately left unquoted so it is split exactly as
	# before; the extra ztest parameters given after "--" are passed
	# through word for word.
	# shellcheck disable=SC2206
	cmd=($ZTEST "${zopt[@]}" "$@")
	desc="$(date '+%m/%d %T') ${cmd[*]}"
	echo "$desc" | tee -a ztest.history
	echo "$desc" >>ztest.out
	"${cmd[@]}" >>ztest.out 2>&1
	ztrc=$?
	grep -E '===|WARNING' ztest.out >>ztest.history

	store_core

	curtime=$(date +%s)
done

echo "zloop finished, $foundcrashes crashes found"

# restore core pattern.
case $(uname) in
Linux)
	echo "$origcorepattern" > /proc/sys/kernel/core_pattern
	;;
*)
	;;
esac

uptime >>ztest.out

# A non-zero exit status tells the caller that at least one crash was seen.
if [[ $foundcrashes -gt 0 ]]; then
	exit 1
fi