mirror of
https://github.com/openzfs/zfs.git
synced 2025-10-01 11:26:49 +00:00

A single slow responding disk can affect the overall read performance of a raidz group. When a raidz child disk is determined to be a persistent slow outlier, then have it sit out during reads for a period of time. The raidz group can use parity to reconstruct the data that was skipped. Each time a slow disk is placed into a sit out period, its `vdev_stat.vs_slow_ios count` is incremented and a zevent class `ereport.fs.zfs.delay` is posted. The length of the sit out period can be changed using the `raid_read_sit_out_secs` module parameter. Setting it to zero disables slow outlier detection. Sponsored-by: Klara, Inc. Sponsored-by: Wasabi Technology, Inc. Reviewed-by: Brian Behlendorf <behlendorf1@llnl.gov> Signed-off-by: Paul Dagnelie <paul.dagnelie@klarasystems.com> Contributions-by: Don Brady <don.brady@klarasystems.com> Contributions-by: Brian Behlendorf <behlendorf1@llnl.gov> Closes #17227
107 lines
3.2 KiB
C
107 lines
3.2 KiB
C
// SPDX-License-Identifier: BSD-2-Clause
|
|
/*
|
|
* Copyright (c) 2007 Pawel Jakub Dawidek <pjd@FreeBSD.org>
|
|
* All rights reserved.
|
|
*
|
|
* Redistribution and use in source and binary forms, with or without
|
|
* modification, are permitted provided that the following conditions
|
|
* are met:
|
|
* 1. Redistributions of source code must retain the above copyright
|
|
* notice, this list of conditions and the following disclaimer.
|
|
* 2. Redistributions in binary form must reproduce the above copyright
|
|
* notice, this list of conditions and the following disclaimer in the
|
|
* documentation and/or other materials provided with the distribution.
|
|
*
|
|
* THIS SOFTWARE IS PROVIDED BY THE AUTHORS AND CONTRIBUTORS ``AS IS'' AND
|
|
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
|
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
|
|
* ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHORS OR CONTRIBUTORS BE LIABLE
|
|
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
|
|
* DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
|
|
* OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
|
|
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
|
|
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
|
|
* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
|
|
* SUCH DAMAGE.
|
|
*/
|
|
|
|
#ifndef _OPENSOLARIS_SYS_TIME_H_
|
|
#define _OPENSOLARIS_SYS_TIME_H_
|
|
#pragma once
|
|
#include_next <sys/time.h>
|
|
#include <sys/debug.h>
|
|
#ifndef _SYS_KERNEL_H_
|
|
extern int hz;
|
|
#endif
|
|
|
|
#define SEC 1
|
|
#define MILLISEC 1000UL
|
|
#define MICROSEC 1000000UL
|
|
#define NANOSEC 1000000000UL
|
|
#define TIME_MAX LLONG_MAX
|
|
|
|
#define MSEC2NSEC(m) ((hrtime_t)(m) * (NANOSEC / MILLISEC))
|
|
#define NSEC2MSEC(n) ((n) / (NANOSEC / MILLISEC))
|
|
|
|
#define USEC2NSEC(m) ((hrtime_t)(m) * (NANOSEC / MICROSEC))
|
|
#define NSEC2USEC(n) ((n) / (NANOSEC / MICROSEC))
|
|
|
|
#define NSEC2SEC(n) ((n) / (NANOSEC / SEC))
|
|
#define SEC2NSEC(m) ((hrtime_t)(m) * (NANOSEC / SEC))
|
|
|
|
typedef longlong_t hrtime_t;
|
|
|
|
#if defined(__i386__) || defined(__powerpc__)
|
|
#define TIMESPEC_OVERFLOW(ts) \
|
|
((ts)->tv_sec < INT32_MIN || (ts)->tv_sec > INT32_MAX)
|
|
#else
|
|
#define TIMESPEC_OVERFLOW(ts) \
|
|
((ts)->tv_sec < INT64_MIN || (ts)->tv_sec > INT64_MAX)
|
|
#endif
|
|
|
|
#define SEC_TO_TICK(sec) ((sec) * hz)
|
|
#define NSEC_TO_TICK(nsec) ((nsec) / (NANOSEC / hz))
|
|
|
|
static __inline hrtime_t
|
|
getlrtime(void)
|
|
{
|
|
struct timespec ts;
|
|
hrtime_t nsec;
|
|
|
|
getnanouptime(&ts);
|
|
nsec = ((hrtime_t)ts.tv_sec * NANOSEC) + ts.tv_nsec;
|
|
return (nsec);
|
|
}
|
|
|
|
static __inline hrtime_t
|
|
gethrtime(void)
|
|
{
|
|
struct timespec ts;
|
|
hrtime_t nsec;
|
|
|
|
nanouptime(&ts);
|
|
nsec = ((hrtime_t)ts.tv_sec * NANOSEC) + ts.tv_nsec;
|
|
return (nsec);
|
|
}
|
|
|
|
#define gethrestime_sec() (time_second)
|
|
#define gethrestime(ts) getnanotime(ts)
|
|
#define gethrtime_waitfree() gethrtime()
|
|
|
|
extern int nsec_per_tick; /* nanoseconds per clock tick */
|
|
|
|
#define ddi_get_lbolt64() \
|
|
(int64_t)(((getsbinuptime() >> 16) * hz) >> 16)
|
|
#define ddi_get_lbolt() (clock_t)ddi_get_lbolt64()
|
|
|
|
#else
|
|
|
|
static __inline hrtime_t
|
|
gethrtime(void)
|
|
{
|
|
struct timespec ts;
|
|
clock_gettime(CLOCK_UPTIME, &ts);
|
|
return (((uint64_t)ts.tv_sec) * NANOSEC + ts.tv_nsec);
|
|
}
|
|
#endif /* !_OPENSOLARIS_SYS_TIME_H_ */
|