mirror of
https://git.proxmox.com/git/mirror_zfs.git
synced 2025-01-25 01:16:34 +03:00
3ec34e5527
Following the fix for 9018 (Replace kmem_cache_reap_now() with kmem_cache_reap_soon), the arc_reclaim_thread() no longer blocks while reaping. However, the code is still confusing and error-prone, because this thread has two responsibilities. We should instead separate this into two threads each with their own responsibility: 1. keep `arc_size` under `arc_c`, by calling `arc_adjust()`, which improves `arc_is_overflowing()` 2. keep enough free memory in the system, by calling `arc_kmem_reap_now()` plus `arc_shrink()`, which improves `arc_available_memory()`. Furthermore, we can use the zthr infrastructure to separate the "should we do something" from "do it" parts of the logic, and normalize the start up / shut down of the threads. Authored by: Brad Lewis <brad.lewis@delphix.com> Reviewed by: Matt Ahrens <mahrens@delphix.com> Reviewed by: Serapheim Dimitropoulos <serapheim@delphix.com> Reviewed by: Pavel Zakharov <pavel.zakharov@delphix.com> Reviewed by: Dan Kimmel <dan.kimmel@delphix.com> Reviewed by: Paul Dagnelie <pcd@delphix.com> Reviewed by: Dan McDonald <danmcd@joyent.com> Reviewed by: Tim Kordas <tim.kordas@joyent.com> Reviewed by: Tim Chase <tim@chase2k.com> Reviewed by: Brian Behlendorf <behlendorf1@llnl.gov> Ported-by: Brad Lewis <brad.lewis@delphix.com> Signed-off-by: Brad Lewis <brad.lewis@delphix.com> OpenZFS-issue: https://www.illumos.org/issues/9284 OpenZFS-commit: https://github.com/openzfs/openzfs/commit/de753e34f9 Closes #8165
188 lines
5.6 KiB
C
188 lines
5.6 KiB
C
/*
 * Copyright (C) 2007-2010 Lawrence Livermore National Security, LLC.
 * Copyright (C) 2007 The Regents of the University of California.
 * Produced at Lawrence Livermore National Laboratory (cf, DISCLAIMER).
 * Written by Brian Behlendorf <behlendorf1@llnl.gov>.
 * UCRL-CODE-235197
 *
 * This file is part of the SPL, Solaris Porting Layer.
 * For details, see <http://zfsonlinux.org/>.
 *
 * The SPL is free software; you can redistribute it and/or modify it
 * under the terms of the GNU General Public License as published by the
 * Free Software Foundation; either version 2 of the License, or (at your
 * option) any later version.
 *
 * The SPL is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
 * for more details.
 *
 * You should have received a copy of the GNU General Public License along
 * with the SPL. If not, see <http://www.gnu.org/licenses/>.
 */
|
|
|
|
#ifndef _SPL_KMEM_H
|
|
#define _SPL_KMEM_H
|
|
|
|
#include <sys/debug.h>
|
|
#include <linux/slab.h>
|
|
#include <linux/sched.h>
|
|
|
|
/*
 * Debugging query and string helpers exported by the SPL kmem code.  Only
 * the prototypes are visible in this header; the definitions live elsewhere.
 *
 * kmem_vasprintf() and kmem_asprintf() take a printf-style format string,
 * so both carry the compiler's printf format attribute.  This lets the
 * compiler check the format string at every call site: (1, 0) for the
 * va_list variant (format string only) and (1, 2) for the variadic
 * variant (format string plus the arguments that follow it).
 *
 * NOTE(review): judging by the names, the *asprintf()/strdup() routines
 * return newly allocated strings that are released with strfree() --
 * confirm against the implementation.
 */
extern int kmem_debugging(void);
extern char *kmem_vasprintf(const char *fmt, va_list ap)
    __attribute__((__format__(__printf__, 1, 0)));
extern char *kmem_asprintf(const char *fmt, ...)
    __attribute__((__format__(__printf__, 1, 2)));
extern char *strdup(const char *str);
extern void strfree(char *str);
|
|
|
|
/*
 * KM_* flags understood by the memory allocation interfaces.
 */
#define	KM_SLEEP	0x0000	/* may block for memory; always succeeds */
#define	KM_NOSLEEP	0x0001	/* must not block for memory; can fail */
#define	KM_PUSHPAGE	0x0004	/* may block for memory; may use reserve */
#define	KM_ZERO		0x1000	/* return zeroed memory */
#define	KM_VMEM		0x2000	/* caller is a vmem_* wrapper */

/* The sleep/nosleep/pushpage flags; KM_ZERO and KM_VMEM are not part of it. */
#define	KM_PUBLIC_MASK	(KM_SLEEP | KM_NOSLEEP | KM_PUSHPAGE)
|
|
|
|
static int spl_fstrans_check(void);
|
|
|
|
/*
|
|
* Convert a KM_* flags mask to its Linux GFP_* counterpart. The conversion
|
|
* function is context aware which means that KM_SLEEP allocations can be
|
|
* safely used in syncing contexts which have set PF_FSTRANS.
|
|
*/
|
|
static inline gfp_t
|
|
kmem_flags_convert(int flags)
|
|
{
|
|
gfp_t lflags = __GFP_NOWARN | __GFP_COMP;
|
|
|
|
if (flags & KM_NOSLEEP) {
|
|
lflags |= GFP_ATOMIC | __GFP_NORETRY;
|
|
} else {
|
|
lflags |= GFP_KERNEL;
|
|
if (spl_fstrans_check())
|
|
lflags &= ~(__GFP_IO|__GFP_FS);
|
|
}
|
|
|
|
if (flags & KM_PUSHPAGE)
|
|
lflags |= __GFP_HIGH;
|
|
|
|
if (flags & KM_ZERO)
|
|
lflags |= __GFP_ZERO;
|
|
|
|
return (lflags);
|
|
}
|
|
|
|
/*
 * Cookie produced by spl_fstrans_mark() and handed back to
 * spl_fstrans_unmark().
 */
typedef struct {
	/* Task that created the cookie. */
	struct task_struct *fstrans_thread;
	/* SPL_FSTRANS bits that were already set when the cookie was made. */
	unsigned int saved_flags;
} fstrans_cookie_t;
|
|
|
|
/*
 * PF_MEMALLOC_NOIO first appeared in Linux 3.9.  Before Linux 3.18 it
 * cannot be relied on by itself, because it does not turn off __GFP_FS as
 * it should.  When the kernel does not define the flag it contributes no
 * bits.
 */
#if defined(PF_MEMALLOC_NOIO)
#define	__SPL_PF_MEMALLOC_NOIO	(PF_MEMALLOC_NOIO)
#else
#define	__SPL_PF_MEMALLOC_NOIO	(0)
#endif

/*
 * PF_FSTRANS was removed in Linux 4.12.  When the kernel does not define
 * the flag it contributes no bits.
 */
#if defined(PF_FSTRANS)
#define	__SPL_PF_FSTRANS	(PF_FSTRANS)
#else
#define	__SPL_PF_FSTRANS	(0)
#endif

/* Union of whichever of the two task flags this kernel provides. */
#define	SPL_FSTRANS	(__SPL_PF_FSTRANS | __SPL_PF_MEMALLOC_NOIO)
|
|
|
|
static inline fstrans_cookie_t
|
|
spl_fstrans_mark(void)
|
|
{
|
|
fstrans_cookie_t cookie;
|
|
|
|
BUILD_BUG_ON(SPL_FSTRANS == 0);
|
|
|
|
cookie.fstrans_thread = current;
|
|
cookie.saved_flags = current->flags & SPL_FSTRANS;
|
|
current->flags |= SPL_FSTRANS;
|
|
|
|
return (cookie);
|
|
}
|
|
|
|
static inline void
|
|
spl_fstrans_unmark(fstrans_cookie_t cookie)
|
|
{
|
|
ASSERT3P(cookie.fstrans_thread, ==, current);
|
|
ASSERT((current->flags & SPL_FSTRANS) == SPL_FSTRANS);
|
|
|
|
current->flags &= ~SPL_FSTRANS;
|
|
current->flags |= cookie.saved_flags;
|
|
}
|
|
|
|
static inline int
|
|
spl_fstrans_check(void)
|
|
{
|
|
return (current->flags & SPL_FSTRANS);
|
|
}
|
|
|
|
/*
|
|
* specifically used to check PF_FSTRANS flag, cannot be relied on for
|
|
* checking spl_fstrans_mark().
|
|
*/
|
|
static inline int
|
|
__spl_pf_fstrans_check(void)
|
|
{
|
|
return (current->flags & __SPL_PF_FSTRANS);
|
|
}
|
|
|
|
#ifdef HAVE_ATOMIC64_T
|
|
#define kmem_alloc_used_add(size) atomic64_add(size, &kmem_alloc_used)
|
|
#define kmem_alloc_used_sub(size) atomic64_sub(size, &kmem_alloc_used)
|
|
#define kmem_alloc_used_read() atomic64_read(&kmem_alloc_used)
|
|
#define kmem_alloc_used_set(size) atomic64_set(&kmem_alloc_used, size)
|
|
extern atomic64_t kmem_alloc_used;
|
|
extern unsigned long long kmem_alloc_max;
|
|
#else /* HAVE_ATOMIC64_T */
|
|
#define kmem_alloc_used_add(size) atomic_add(size, &kmem_alloc_used)
|
|
#define kmem_alloc_used_sub(size) atomic_sub(size, &kmem_alloc_used)
|
|
#define kmem_alloc_used_read() atomic_read(&kmem_alloc_used)
|
|
#define kmem_alloc_used_set(size) atomic_set(&kmem_alloc_used, size)
|
|
extern atomic_t kmem_alloc_used;
|
|
extern unsigned long long kmem_alloc_max;
|
|
#endif /* HAVE_ATOMIC64_T */
|
|
|
|
/*
 * Variables defined elsewhere in the SPL.
 * NOTE(review): presumably the size thresholds at which a kmem allocation
 * triggers a warning / is refused -- confirm against the defining file.
 */
extern unsigned int spl_kmem_alloc_warn;
extern unsigned int spl_kmem_alloc_max;
|
|
|
|
/*
 * Public allocation entry points.
 *
 * kmem_alloc() and kmem_zalloc() forward the size and flags to the spl_*
 * implementation together with the calling function's name and line number.
 * kmem_free() and kmem_cache_reap_active map directly onto their spl_*
 * counterparts.
 */
extern void *spl_kmem_alloc(size_t sz, int fl, const char *func, int line);
extern void *spl_kmem_zalloc(size_t sz, int fl, const char *func, int line);
extern void spl_kmem_free(const void *ptr, size_t sz);

#define	kmem_alloc(sz, fl)	spl_kmem_alloc((sz), (fl), __func__, __LINE__)
#define	kmem_zalloc(sz, fl)	spl_kmem_zalloc((sz), (fl), __func__, __LINE__)
#define	kmem_free(ptr, sz)	spl_kmem_free((ptr), (sz))
#define	kmem_cache_reap_active	spl_kmem_cache_reap_active
|
|
|
|
/*
 * Internal-use only: the functions below are not part of the public kmem
 * interface.
 *
 * NOTE(review): the _impl/_debug/_track suffixes suggest plain, debugging
 * and allocation-tracking variants of the same allocate/free pair; only
 * the prototypes are visible here -- confirm against the implementation.
 */
extern void *spl_kmem_alloc_impl(size_t size, int flags, int node);
extern void spl_kmem_free_impl(const void *buf, size_t size);

extern void *spl_kmem_alloc_debug(size_t size, int flags, int node);
extern void spl_kmem_free_debug(const void *buf, size_t size);

extern void *spl_kmem_alloc_track(size_t size, int flags,
    const char *func, int line, int node);
extern void spl_kmem_free_track(const void *buf, size_t size);
|
|
|
|
/*
 * Subsystem setup/teardown and the reap-activity query that the
 * kmem_cache_reap_active macro in this header expands to.
 * NOTE(review): return-value conventions are not visible from this header.
 */
extern int spl_kmem_init(void);
extern void spl_kmem_fini(void);
extern int spl_kmem_cache_reap_active(void);
|
|
|
|
#endif /* _SPL_KMEM_H */
|