#include "opt_vm.h"
#include <sys/systm.h>
#include <sys/blockcount.h>
#include <sys/conf.h>
#include <sys/cpuset.h>
#include <sys/ipc.h>
#include <sys/jail.h>
#include <sys/limits.h>
#include <sys/lock.h>
#include <sys/mman.h>
#include <sys/mount.h>
#include <sys/kernel.h>
#include <sys/mutex.h>
#include <sys/pctrie.h>
#include <sys/proc.h>
#include <sys/refcount.h>
#include <sys/shm.h>
#include <sys/sx.h>
#include <sys/sysctl.h>
#include <sys/resourcevar.h>
#include <sys/refcount.h>
#include <sys/rwlock.h>
#include <sys/user.h>
#include <sys/vnode.h>
#include <sys/vmmeter.h>
#include <vm/vm.h>
#include <vm/vm_param.h>
#include <vm/pmap.h>
#include <vm/vm_map.h>
#include <vm/vm_object.h>
#include <vm/vm_page.h>
#include <vm/vm_pageout.h>
#include <vm/vm_pager.h>
#include <vm/vm_phys.h>
#include <vm/vm_pagequeue.h>
#include <vm/swap_pager.h>
#include <vm/vm_kern.h>
#include <vm/vm_extern.h>
#include <vm/vm_radix.h>
#include <vm/vm_reserv.h>
#include <vm/uma.h>
static int old_msync;
SYSCTL_INT(_vm, OID_AUTO, old_msync, CTLFLAG_RW, &old_msync, 0,
"Use old (insecure) msync behavior");
static boolean_t vm_object_page_remove_write(vm_page_t p, int flags,
boolean_t *allclean);
static void vm_object_backing_remove(vm_object_t object);
struct object_q vm_object_list;
struct mtx vm_object_list_mtx;
struct vm_object kernel_object_store;
static SYSCTL_NODE(_vm_stats, OID_AUTO, object, CTLFLAG_RD | CTLFLAG_MPSAFE, 0,
"VM object stats");
static COUNTER_U64_DEFINE_EARLY(object_collapses);
SYSCTL_COUNTER_U64(_vm_stats_object, OID_AUTO, collapses, CTLFLAG_RD,
&object_collapses,
"VM object collapses");
static COUNTER_U64_DEFINE_EARLY(object_bypasses);
SYSCTL_COUNTER_U64(_vm_stats_object, OID_AUTO, bypasses, CTLFLAG_RD,
&object_bypasses,
"VM object bypasses");
static COUNTER_U64_DEFINE_EARLY(object_collapse_waits);
SYSCTL_COUNTER_U64(_vm_stats_object, OID_AUTO, collapse_waits, CTLFLAG_RD,
&object_collapse_waits,
"Number of sleeps for collapse");
static uma_zone_t obj_zone;
static int vm_object_zinit(void *mem, int size, int flags);
#ifdef INVARIANTS
static void vm_object_zdtor(void *mem, int size, void *arg);
static void
vm_object_zdtor(void *mem, int size, void *arg)
{
vm_object_t object;
object = (vm_object_t)mem;
KASSERT(object->ref_count == 0,
("object %p ref_count = %d", object, object->ref_count));
KASSERT(vm_radix_is_empty(&object->rtree),
("object %p has resident pages in its trie", object));
#if VM_NRESERVLEVEL > 0
KASSERT(LIST_EMPTY(&object->rvq),
("object %p has reservations",
object));
#endif
KASSERT(!vm_object_busied(object),
("object %p busy = %d", object, blockcount_read(&object->busy)));
KASSERT(object->resident_page_count == 0,
("object %p resident_page_count = %d",
object, object->resident_page_count));
KASSERT(atomic_load_int(&object->shadow_count) == 0,
("object %p shadow_count = %d",
object, atomic_load_int(&object->shadow_count)));
KASSERT(object->type == OBJT_DEAD,
("object %p has non-dead type %d",
object, object->type));
KASSERT(object->charge == 0 && object->cred == NULL,
("object %p has non-zero charge %ju (%p)",
object, (uintmax_t)object->charge, object->cred));
}
#endif
static int
vm_object_zinit(void *mem, int size, int flags)
{
vm_object_t object;
object = (vm_object_t)mem;
rw_init_flags(&object->lock, "vmobject", RW_DUPOK | RW_NEW);
object->type = OBJT_DEAD;
vm_radix_init(&object->rtree);
refcount_init(&object->ref_count, 0);
blockcount_init(&object->paging_in_progress);
blockcount_init(&object->busy);
object->resident_page_count = 0;
atomic_store_int(&object->shadow_count, 0);
object->flags = OBJ_DEAD;
mtx_lock(&vm_object_list_mtx);
TAILQ_INSERT_TAIL(&vm_object_list, object, object_list);
mtx_unlock(&vm_object_list_mtx);
return (0);
}
static void
_vm_object_allocate(objtype_t type, vm_pindex_t size, u_short flags,
vm_object_t object, void *handle)
{
LIST_INIT(&object->shadow_head);
object->type = type;
object->flags = flags;
if ((flags & OBJ_SWAP) != 0) {
pctrie_init(&object->un_pager.swp.swp_blks);
object->un_pager.swp.writemappings = 0;
}
atomic_thread_fence_rel();
object->pg_color = 0;
object->size = size;
object->domain.dr_policy = NULL;
object->generation = 1;
object->cleangeneration = 1;
refcount_init(&object->ref_count, 1);
object->memattr = VM_MEMATTR_DEFAULT;
object->cred = NULL;
object->charge = 0;
object->handle = handle;
object->backing_object = NULL;
object->backing_object_offset = (vm_ooffset_t) 0;
#if VM_NRESERVLEVEL > 0
LIST_INIT(&object->rvq);
#endif
umtx_shm_object_init(object);
}
void
vm_object_init(void)
{
TAILQ_INIT(&vm_object_list);
mtx_init(&vm_object_list_mtx, "vm object_list", NULL, MTX_DEF);
rw_init(&kernel_object->lock, "kernel vm object");
vm_radix_init(&kernel_object->rtree);
_vm_object_allocate(OBJT_PHYS, atop(VM_MAX_KERNEL_ADDRESS -
VM_MIN_KERNEL_ADDRESS), OBJ_UNMANAGED, kernel_object, NULL);
#if VM_NRESERVLEVEL > 0
kernel_object->flags |= OBJ_COLORED;
kernel_object->pg_color = (u_short)atop(VM_MIN_KERNEL_ADDRESS);
#endif
kernel_object->un_pager.phys.ops = &default_phys_pg_ops;
obj_zone = uma_zcreate("VM OBJECT", sizeof (struct vm_object), NULL,
#ifdef INVARIANTS
vm_object_zdtor,
#else
NULL,
#endif
vm_object_zinit, NULL, UMA_ALIGN_PTR, UMA_ZONE_NOFREE);
vm_radix_zinit();
}
void
vm_object_clear_flag(vm_object_t object, u_short bits)
{
VM_OBJECT_ASSERT_WLOCKED(object);
object->flags &= ~bits;
}
int
vm_object_set_memattr(vm_object_t object, vm_memattr_t memattr)
{
VM_OBJECT_ASSERT_WLOCKED(object);
if (object->type == OBJT_DEAD)
return (KERN_INVALID_ARGUMENT);
if (!vm_radix_is_empty(&object->rtree))
return (KERN_FAILURE);
object->memattr = memattr;
return (KERN_SUCCESS);
}
void
vm_object_pip_add(vm_object_t object, short i)
{
if (i > 0)
blockcount_acquire(&object->paging_in_progress, i);
}
void
vm_object_pip_wakeup(vm_object_t object)
{
vm_object_pip_wakeupn(object, 1);
}
void
vm_object_pip_wakeupn(vm_object_t object, short i)
{
if (i > 0)
blockcount_release(&object->paging_in_progress, i);
}
static void
vm_object_pip_sleep(vm_object_t object, const char *waitid)
{
(void)blockcount_sleep(&object->paging_in_progress, &object->lock,
waitid, PVM | PDROP);
}
void
vm_object_pip_wait(vm_object_t object, const char *waitid)
{
VM_OBJECT_ASSERT_WLOCKED(object);
blockcount_wait(&object->paging_in_progress, &object->lock, waitid,
PVM);
}
void
vm_object_pip_wait_unlocked(vm_object_t object, const char *waitid)
{
VM_OBJECT_ASSERT_UNLOCKED(object);
blockcount_wait(&object->paging_in_progress, NULL, waitid, PVM);
}
vm_object_t
vm_object_allocate(objtype_t type, vm_pindex_t size)
{
vm_object_t object;
u_short flags;
switch (type) {
case OBJT_DEAD:
panic("vm_object_allocate: can't create OBJT_DEAD");
case OBJT_SWAP:
flags = OBJ_COLORED | OBJ_SWAP;
break;
case OBJT_DEVICE:
case OBJT_SG:
flags = OBJ_FICTITIOUS | OBJ_UNMANAGED;
break;
case OBJT_MGTDEVICE:
flags = OBJ_FICTITIOUS;
break;
case OBJT_PHYS:
flags = OBJ_UNMANAGED;
break;
case OBJT_VNODE:
flags = 0;
break;
default:
panic("vm_object_allocate: type %d is undefined or dynamic",
type);
}
object = (vm_object_t)uma_zalloc(obj_zone, M_WAITOK);
_vm_object_allocate(type, size, flags, object, NULL);
return (object);
}
vm_object_t
vm_object_allocate_dyn(objtype_t dyntype, vm_pindex_t size, u_short flags)
{
vm_object_t object;
MPASS(dyntype >= OBJT_FIRST_DYN );
object = (vm_object_t)uma_zalloc(obj_zone, M_WAITOK);
_vm_object_allocate(dyntype, size, flags, object, NULL);
return (object);
}
vm_object_t
vm_object_allocate_anon(vm_pindex_t size, vm_object_t backing_object,
struct ucred *cred, vm_size_t charge)
{
vm_object_t handle, object;
if (backing_object == NULL)
handle = NULL;
else if ((backing_object->flags & OBJ_ANON) != 0)
handle = backing_object->handle;
else
handle = backing_object;
object = uma_zalloc(obj_zone, M_WAITOK);
_vm_object_allocate(OBJT_SWAP, size,
OBJ_ANON | OBJ_ONEMAPPING | OBJ_SWAP, object, handle);
object->cred = cred;
object->charge = cred != NULL ? charge : 0;
return (object);
}
static void
vm_object_reference_vnode(vm_object_t object)
{
u_int old;
if (!refcount_acquire_if_gt(&object->ref_count, 0)) {
VM_OBJECT_RLOCK(object);
old = refcount_acquire(&object->ref_count);
if (object->type == OBJT_VNODE && old == 0)
vref(object->handle);
VM_OBJECT_RUNLOCK(object);
}
}
void
vm_object_reference(vm_object_t object)
{
if (object == NULL)
return;
if (object->type == OBJT_VNODE)
vm_object_reference_vnode(object);
else
refcount_acquire(&object->ref_count);
KASSERT((object->flags & OBJ_DEAD) == 0,
("vm_object_reference: Referenced dead object."));
}
void
vm_object_reference_locked(vm_object_t object)
{
u_int old;
VM_OBJECT_ASSERT_LOCKED(object);
old = refcount_acquire(&object->ref_count);
if (object->type == OBJT_VNODE && old == 0)
vref(object->handle);
KASSERT((object->flags & OBJ_DEAD) == 0,
("vm_object_reference: Referenced dead object."));
}
static void
vm_object_deallocate_vnode(vm_object_t object)
{
struct vnode *vp = (struct vnode *) object->handle;
bool last;
KASSERT(object->type == OBJT_VNODE,
("vm_object_deallocate_vnode: not a vnode object"));
KASSERT(vp != NULL, ("vm_object_deallocate_vnode: missing vp"));
last = refcount_release(&object->ref_count);
VM_OBJECT_RUNLOCK(object);
if (!last)
return;
if (!umtx_shm_vnobj_persistent)
umtx_shm_object_terminated(object);
vrele(vp);
}
static vm_object_t
vm_object_deallocate_anon(vm_object_t backing_object)
{
vm_object_t object;
object = LIST_FIRST(&backing_object->shadow_head);
KASSERT(object != NULL &&
atomic_load_int(&backing_object->shadow_count) == 1,
("vm_object_anon_deallocate: ref_count: %d, shadow_count: %d",
backing_object->ref_count,
atomic_load_int(&backing_object->shadow_count)));
KASSERT((object->flags & OBJ_ANON) != 0,
("invalid shadow object %p", object));
if (!VM_OBJECT_TRYWLOCK(object)) {
vm_object_pip_add(object, 1);
VM_OBJECT_WUNLOCK(backing_object);
VM_OBJECT_WLOCK(object);
vm_object_pip_wakeup(object);
} else
VM_OBJECT_WUNLOCK(backing_object);
if ((object->flags & (OBJ_DEAD | OBJ_COLLAPSING)) != 0 ||
!refcount_acquire_if_not_zero(&object->ref_count)) {
VM_OBJECT_WUNLOCK(object);
return (NULL);
}
backing_object = object->backing_object;
if (backing_object != NULL && (backing_object->flags & OBJ_ANON) != 0)
vm_object_collapse(object);
VM_OBJECT_WUNLOCK(object);
return (object);
}
void
vm_object_deallocate(vm_object_t object)
{
vm_object_t temp;
bool released;
while (object != NULL) {
if ((object->flags & OBJ_ANON) == 0)
released = refcount_release_if_gt(&object->ref_count, 1);
else
released = refcount_release_if_gt(&object->ref_count, 2);
if (released)
return;
if (object->type == OBJT_VNODE) {
VM_OBJECT_RLOCK(object);
if (object->type == OBJT_VNODE) {
vm_object_deallocate_vnode(object);
return;
}
VM_OBJECT_RUNLOCK(object);
}
VM_OBJECT_WLOCK(object);
KASSERT(object->ref_count > 0,
("vm_object_deallocate: object deallocated too many times: %d",
object->type));
if (!refcount_release(&object->ref_count)) {
if (object->ref_count > 1 ||
atomic_load_int(&object->shadow_count) == 0) {
if ((object->flags & OBJ_ANON) != 0 &&
object->ref_count == 1)
vm_object_set_flag(object,
OBJ_ONEMAPPING);
VM_OBJECT_WUNLOCK(object);
return;
}
object = vm_object_deallocate_anon(object);
continue;
}
umtx_shm_object_terminated(object);
temp = object->backing_object;
if (temp != NULL) {
KASSERT(object->type == OBJT_SWAP,
("shadowed tmpfs v_object 2 %p", object));
vm_object_backing_remove(object);
}
KASSERT((object->flags & OBJ_DEAD) == 0,
("vm_object_deallocate: Terminating dead object."));
vm_object_set_flag(object, OBJ_DEAD);
vm_object_terminate(object);
object = temp;
}
}
void
vm_object_destroy(vm_object_t object)
{
uma_zfree(obj_zone, object);
}
static void
vm_object_sub_shadow(vm_object_t object)
{
KASSERT(object->shadow_count >= 1,
("object %p sub_shadow count zero", object));
atomic_subtract_int(&object->shadow_count, 1);
}
static void
vm_object_backing_remove_locked(vm_object_t object)
{
vm_object_t backing_object;
backing_object = object->backing_object;
VM_OBJECT_ASSERT_WLOCKED(object);
VM_OBJECT_ASSERT_WLOCKED(backing_object);
KASSERT((object->flags & OBJ_COLLAPSING) == 0,
("vm_object_backing_remove: Removing collapsing object."));
vm_object_sub_shadow(backing_object);
if ((object->flags & OBJ_SHADOWLIST) != 0) {
LIST_REMOVE(object, shadow_list);
vm_object_clear_flag(object, OBJ_SHADOWLIST);
}
object->backing_object = NULL;
}
static void
vm_object_backing_remove(vm_object_t object)
{
vm_object_t backing_object;
VM_OBJECT_ASSERT_WLOCKED(object);
backing_object = object->backing_object;
if ((object->flags & OBJ_SHADOWLIST) != 0) {
VM_OBJECT_WLOCK(backing_object);
vm_object_backing_remove_locked(object);
VM_OBJECT_WUNLOCK(backing_object);
} else {
object->backing_object = NULL;
vm_object_sub_shadow(backing_object);
}
}
static void
vm_object_backing_insert_locked(vm_object_t object, vm_object_t backing_object)
{
VM_OBJECT_ASSERT_WLOCKED(object);
atomic_add_int(&backing_object->shadow_count, 1);
if ((backing_object->flags & OBJ_ANON) != 0) {
VM_OBJECT_ASSERT_WLOCKED(backing_object);
LIST_INSERT_HEAD(&backing_object->shadow_head, object,
shadow_list);
vm_object_set_flag(object, OBJ_SHADOWLIST);
}
object->backing_object = backing_object;
}
static void
vm_object_backing_insert(vm_object_t object, vm_object_t backing_object)
{
VM_OBJECT_ASSERT_WLOCKED(object);
if ((backing_object->flags & OBJ_ANON) != 0) {
VM_OBJECT_WLOCK(backing_object);
vm_object_backing_insert_locked(object, backing_object);
VM_OBJECT_WUNLOCK(backing_object);
} else {
object->backing_object = backing_object;
atomic_add_int(&backing_object->shadow_count, 1);
}
}
static void
vm_object_backing_insert_ref(vm_object_t object, vm_object_t backing_object)
{
VM_OBJECT_ASSERT_WLOCKED(object);
if ((backing_object->flags & OBJ_ANON) != 0) {
VM_OBJECT_WLOCK(backing_object);
KASSERT((backing_object->flags & OBJ_DEAD) == 0,
("shadowing dead anonymous object"));
vm_object_reference_locked(backing_object);
vm_object_backing_insert_locked(object, backing_object);
vm_object_clear_flag(backing_object, OBJ_ONEMAPPING);
VM_OBJECT_WUNLOCK(backing_object);
} else {
vm_object_reference(backing_object);
atomic_add_int(&backing_object->shadow_count, 1);
object->backing_object = backing_object;
}
}
static void
vm_object_backing_transfer(vm_object_t object, vm_object_t backing_object)
{
vm_object_t new_backing_object;
vm_object_backing_remove_locked(object);
new_backing_object = backing_object->backing_object;
if (new_backing_object == NULL)
return;
if ((new_backing_object->flags & OBJ_ANON) != 0) {
VM_OBJECT_WLOCK(new_backing_object);
vm_object_backing_remove_locked(backing_object);
vm_object_backing_insert_locked(object, new_backing_object);
VM_OBJECT_WUNLOCK(new_backing_object);
} else {
object->backing_object = new_backing_object;
backing_object->backing_object = NULL;
}
}
static void
vm_object_collapse_wait(vm_object_t object)
{
VM_OBJECT_ASSERT_WLOCKED(object);
while ((object->flags & OBJ_COLLAPSING) != 0) {
vm_object_pip_wait(object, "vmcolwait");
counter_u64_add(object_collapse_waits, 1);
}
}
static vm_object_t
vm_object_backing_collapse_wait(vm_object_t object)
{
vm_object_t backing_object;
VM_OBJECT_ASSERT_WLOCKED(object);
for (;;) {
backing_object = object->backing_object;
if (backing_object == NULL ||
(backing_object->flags & OBJ_ANON) == 0)
return (NULL);
VM_OBJECT_WLOCK(backing_object);
if ((backing_object->flags & (OBJ_DEAD | OBJ_COLLAPSING)) == 0)
break;
VM_OBJECT_WUNLOCK(object);
vm_object_pip_sleep(backing_object, "vmbckwait");
counter_u64_add(object_collapse_waits, 1);
VM_OBJECT_WLOCK(object);
}
return (backing_object);
}
static void
vm_object_terminate_single_page(vm_page_t p, void *objectv)
{
vm_object_t object __diagused = objectv;
vm_page_assert_unbusied(p);
KASSERT(p->object == object &&
(p->ref_count & VPRC_OBJREF) != 0,
("%s: page %p is inconsistent", __func__, p));
p->object = NULL;
if (vm_page_drop(p, VPRC_OBJREF) == VPRC_OBJREF) {
KASSERT((object->flags & OBJ_UNMANAGED) != 0 ||
vm_page_astate_load(p).queue != PQ_NONE,
("%s: page %p does not belong to a queue", __func__, p));
VM_CNT_INC(v_pfree);
vm_page_free(p);
}
}
static void
vm_object_terminate_pages(vm_object_t object)
{
VM_OBJECT_ASSERT_WLOCKED(object);
if (object->resident_page_count == 0)
return;
vm_radix_reclaim_callback(&object->rtree,
vm_object_terminate_single_page, object);
object->resident_page_count = 0;
if (object->type == OBJT_VNODE)
vdrop(object->handle);
}
void
vm_object_terminate(vm_object_t object)
{
VM_OBJECT_ASSERT_WLOCKED(object);
KASSERT((object->flags & OBJ_DEAD) != 0,
("terminating non-dead obj %p", object));
KASSERT((object->flags & OBJ_COLLAPSING) == 0,
("terminating collapsing obj %p", object));
KASSERT(object->backing_object == NULL,
("terminating shadow obj %p", object));
vm_object_pip_wait(object, "objtrm");
KASSERT(object->ref_count == 0,
("vm_object_terminate: object with references, ref_count=%d",
object->ref_count));
if ((object->flags & OBJ_PG_DTOR) == 0)
vm_object_terminate_pages(object);
#if VM_NRESERVLEVEL > 0
if (__predict_false(!LIST_EMPTY(&object->rvq)))
vm_reserv_break_all(object);
#endif
KASSERT(object->cred == NULL || (object->flags & OBJ_SWAP) != 0,
("%s: non-swap obj %p has cred", __func__, object));
vm_pager_deallocate(object);
VM_OBJECT_WUNLOCK(object);
vm_object_destroy(object);
}
static boolean_t
vm_object_page_remove_write(vm_page_t p, int flags, boolean_t *allclean)
{
vm_page_assert_busied(p);
if ((flags & OBJPC_NOSYNC) != 0 && (p->a.flags & PGA_NOSYNC) != 0) {
*allclean = FALSE;
return (FALSE);
} else {
pmap_remove_write(p);
return (p->dirty != 0);
}
}
static int
vm_object_page_clean_flush(struct pctrie_iter *pages, vm_page_t p,
int pagerflags, int flags, boolean_t *allclean, bool *eio)
{
vm_page_t ma[vm_pageout_page_count];
int count, runlen;
vm_page_assert_xbusied(p);
ma[0] = p;
runlen = vm_radix_iter_lookup_range(pages, p->pindex + 1,
&ma[1], vm_pageout_page_count - 1);
for (count = 1; count <= runlen; count++) {
p = ma[count];
if (vm_page_tryxbusy(p) == 0)
break;
if (!vm_object_page_remove_write(p, flags, allclean)) {
vm_page_xunbusy(p);
break;
}
}
return (vm_pageout_flush(ma, count, pagerflags, eio));
}
boolean_t
vm_object_page_clean(vm_object_t object, vm_ooffset_t start, vm_ooffset_t end,
int flags)
{
struct pctrie_iter pages;
vm_page_t np, p;
vm_pindex_t pi, tend, tstart;
int curgeneration, n, pagerflags;
boolean_t res, allclean;
bool eio;
VM_OBJECT_ASSERT_WLOCKED(object);
if (!vm_object_mightbedirty(object) || object->resident_page_count == 0)
return (TRUE);
pagerflags = (flags & (OBJPC_SYNC | OBJPC_INVAL)) != 0 ?
VM_PAGER_PUT_SYNC : VM_PAGER_CLUSTER_OK;
pagerflags |= (flags & OBJPC_INVAL) != 0 ? VM_PAGER_PUT_INVAL : 0;
tstart = OFF_TO_IDX(start);
tend = (end == 0) ? object->size : OFF_TO_IDX(end + PAGE_MASK);
allclean = tstart == 0 && tend >= object->size;
res = TRUE;
vm_page_iter_init(&pages, object);
rescan:
curgeneration = object->generation;
for (p = vm_radix_iter_lookup_ge(&pages, tstart); p != NULL; p = np) {
pi = p->pindex;
if (pi >= tend)
break;
if (vm_page_none_valid(p)) {
np = vm_radix_iter_step(&pages);
continue;
}
if (!vm_page_busy_acquire(p, VM_ALLOC_WAITFAIL)) {
pctrie_iter_reset(&pages);
if (object->generation != curgeneration &&
(flags & OBJPC_SYNC) != 0)
goto rescan;
np = vm_radix_iter_lookup_ge(&pages, pi);
continue;
}
if (!vm_object_page_remove_write(p, flags, &allclean)) {
np = vm_radix_iter_step(&pages);
vm_page_xunbusy(p);
continue;
}
if (object->type == OBJT_VNODE) {
n = vm_object_page_clean_flush(&pages, p, pagerflags,
flags, &allclean, &eio);
pctrie_iter_reset(&pages);
if (eio) {
res = FALSE;
allclean = FALSE;
}
if (object->generation != curgeneration &&
(flags & OBJPC_SYNC) != 0)
goto rescan;
if (n == 0) {
n = 1;
allclean = FALSE;
}
} else {
n = 1;
vm_page_xunbusy(p);
}
np = vm_radix_iter_lookup_ge(&pages, pi + n);
}
#if 0
VOP_FSYNC(vp, (pagerflags & VM_PAGER_PUT_SYNC) ? MNT_WAIT : 0);
#endif
if (allclean && object->type == OBJT_VNODE)
object->cleangeneration = curgeneration;
return (res);
}
boolean_t
vm_object_sync(vm_object_t object, vm_ooffset_t offset, vm_size_t size,
boolean_t syncio, boolean_t invalidate)
{
vm_object_t backing_object;
struct vnode *vp;
struct mount *mp;
int error, flags, fsync_after;
boolean_t res;
if (object == NULL)
return (TRUE);
res = TRUE;
error = 0;
VM_OBJECT_WLOCK(object);
while ((backing_object = object->backing_object) != NULL) {
VM_OBJECT_WLOCK(backing_object);
offset += object->backing_object_offset;
VM_OBJECT_WUNLOCK(object);
object = backing_object;
if (object->size < OFF_TO_IDX(offset + size))
size = IDX_TO_OFF(object->size) - offset;
}
if (object->type == OBJT_VNODE &&
vm_object_mightbedirty(object) != 0 &&
((vp = object->handle)->v_vflag & VV_NOSYNC) == 0) {
VM_OBJECT_WUNLOCK(object);
(void)vn_start_write(vp, &mp, V_WAIT);
vn_lock(vp, LK_EXCLUSIVE | LK_RETRY);
if (syncio && !invalidate && offset == 0 &&
atop(size) == object->size) {
flags = 0;
fsync_after = TRUE;
} else {
flags = (syncio || invalidate) ? OBJPC_SYNC : 0;
flags |= invalidate ? (OBJPC_SYNC | OBJPC_INVAL) : 0;
fsync_after = FALSE;
}
VM_OBJECT_WLOCK(object);
res = vm_object_page_clean(object, offset, offset + size,
flags);
VM_OBJECT_WUNLOCK(object);
if (fsync_after) {
for (;;) {
error = VOP_FSYNC(vp, MNT_WAIT, curthread);
if (error != ERELOOKUP)
break;
VOP_UNLOCK(vp);
vn_finished_write(mp);
(void)vn_start_write(vp, &mp, V_WAIT);
vn_lock(vp, LK_EXCLUSIVE | LK_RETRY);
}
}
VOP_UNLOCK(vp);
vn_finished_write(mp);
if (error != 0)
res = FALSE;
VM_OBJECT_WLOCK(object);
}
if ((object->type == OBJT_VNODE ||
object->type == OBJT_DEVICE) && invalidate) {
if (object->type == OBJT_DEVICE)
flags = OBJPR_NOTMAPPED;
else if (old_msync)
flags = 0;
else
flags = OBJPR_CLEANONLY;
vm_object_page_remove(object, OFF_TO_IDX(offset),
OFF_TO_IDX(offset + size + PAGE_MASK), flags);
}
VM_OBJECT_WUNLOCK(object);
return (res);
}
static bool
vm_object_advice_applies(vm_object_t object, int advice)
{
if ((object->flags & OBJ_UNMANAGED) != 0)
return (false);
if (advice != MADV_FREE)
return (true);
return ((object->flags & (OBJ_ONEMAPPING | OBJ_ANON)) ==
(OBJ_ONEMAPPING | OBJ_ANON));
}
static void
vm_object_madvise_freespace(vm_object_t object, int advice, vm_pindex_t pindex,
vm_size_t size)
{
if (advice == MADV_FREE)
vm_pager_freespace(object, pindex, size);
}
void
vm_object_madvise(vm_object_t object, vm_pindex_t pindex, vm_pindex_t end,
int advice)
{
struct pctrie_iter pages;
vm_pindex_t tpindex;
vm_object_t backing_object, tobject;
vm_page_t m, tm;
if (object == NULL)
return;
vm_page_iter_init(&pages, object);
relookup:
VM_OBJECT_WLOCK(object);
if (!vm_object_advice_applies(object, advice)) {
VM_OBJECT_WUNLOCK(object);
return;
}
for (m = vm_radix_iter_lookup_ge(&pages, pindex); pindex < end;
pindex++) {
tobject = object;
if (m == NULL || pindex < m->pindex) {
if (object->backing_object == NULL) {
tpindex = (m != NULL && m->pindex < end) ?
m->pindex : end;
vm_object_madvise_freespace(object, advice,
pindex, tpindex - pindex);
if ((pindex = tpindex) == end)
break;
goto next_page;
}
tpindex = pindex;
do {
vm_object_madvise_freespace(tobject, advice,
tpindex, 1);
backing_object = tobject->backing_object;
if (backing_object == NULL)
goto next_pindex;
VM_OBJECT_WLOCK(backing_object);
tpindex +=
OFF_TO_IDX(tobject->backing_object_offset);
if (tobject != object)
VM_OBJECT_WUNLOCK(tobject);
tobject = backing_object;
if (!vm_object_advice_applies(tobject, advice))
goto next_pindex;
} while ((tm = vm_page_lookup(tobject, tpindex)) ==
NULL);
} else {
next_page:
tm = m;
m = vm_radix_iter_step(&pages);
}
if (!vm_page_all_valid(tm) || vm_page_wired(tm))
goto next_pindex;
KASSERT((tm->flags & PG_FICTITIOUS) == 0,
("vm_object_madvise: page %p is fictitious", tm));
KASSERT((tm->oflags & VPO_UNMANAGED) == 0,
("vm_object_madvise: page %p is not managed", tm));
if (vm_page_tryxbusy(tm) == 0) {
if (object != tobject)
VM_OBJECT_WUNLOCK(object);
if (advice == MADV_WILLNEED) {
vm_page_aflag_set(tm, PGA_REFERENCED);
}
if (!vm_page_busy_sleep(tm, "madvpo", 0))
VM_OBJECT_WUNLOCK(tobject);
pctrie_iter_reset(&pages);
goto relookup;
}
vm_page_advise(tm, advice);
vm_page_xunbusy(tm);
vm_object_madvise_freespace(tobject, advice, tm->pindex, 1);
next_pindex:
if (tobject != object)
VM_OBJECT_WUNLOCK(tobject);
}
VM_OBJECT_WUNLOCK(object);
}
void
vm_object_shadow(vm_object_t *object, vm_ooffset_t *offset, vm_size_t length,
struct ucred *cred, bool shared)
{
vm_object_t source;
vm_object_t result;
source = *object;
if (source != NULL && source->ref_count == 1 &&
(source->flags & OBJ_ANON) != 0)
return;
result = vm_object_allocate_anon(atop(length), source, cred, length);
result->backing_object_offset = *offset;
if (shared || source != NULL) {
VM_OBJECT_WLOCK(result);
if (shared) {
vm_object_reference_locked(result);
vm_object_clear_flag(result, OBJ_ONEMAPPING);
}
if (source != NULL) {
vm_object_backing_insert(result, source);
result->domain = source->domain;
#if VM_NRESERVLEVEL > 0
vm_object_set_flag(result,
(source->flags & OBJ_COLORED));
result->pg_color = (source->pg_color +
OFF_TO_IDX(*offset)) & ((1 << (VM_NFREEORDER -
1)) - 1);
#endif
}
VM_OBJECT_WUNLOCK(result);
}
*offset = 0;
*object = result;
}
void
vm_object_split(vm_map_entry_t entry)
{
struct pctrie_iter pages;
vm_page_t m;
vm_object_t orig_object, new_object, backing_object;
vm_pindex_t offidxstart;
vm_size_t size;
orig_object = entry->object.vm_object;
KASSERT((orig_object->flags & OBJ_ONEMAPPING) != 0,
("vm_object_split: Splitting object with multiple mappings."));
if ((orig_object->flags & OBJ_ANON) == 0)
return;
if (orig_object->ref_count <= 1)
return;
VM_OBJECT_WUNLOCK(orig_object);
offidxstart = OFF_TO_IDX(entry->offset);
size = atop(entry->end - entry->start);
new_object = vm_object_allocate_anon(size, orig_object,
orig_object->cred, ptoa(size));
VM_OBJECT_WLOCK(orig_object);
vm_object_collapse_wait(orig_object);
VM_OBJECT_WLOCK(new_object);
new_object->domain = orig_object->domain;
backing_object = orig_object->backing_object;
if (backing_object != NULL) {
vm_object_backing_insert_ref(new_object, backing_object);
new_object->backing_object_offset =
orig_object->backing_object_offset + entry->offset;
}
if (orig_object->cred != NULL) {
crhold(orig_object->cred);
KASSERT(orig_object->charge >= ptoa(size),
("orig_object->charge < 0"));
orig_object->charge -= ptoa(size);
}
vm_object_set_flag(orig_object, OBJ_SPLIT);
vm_page_iter_limit_init(&pages, orig_object, offidxstart + size);
retry:
KASSERT(pctrie_iter_is_reset(&pages),
("%s: pctrie_iter not reset for retry", __func__));
for (m = vm_radix_iter_lookup_ge(&pages, offidxstart); m != NULL;
m = vm_radix_iter_step(&pages)) {
if (vm_page_tryxbusy(m) == 0) {
VM_OBJECT_WUNLOCK(new_object);
if (vm_page_busy_sleep(m, "spltwt", 0))
VM_OBJECT_WLOCK(orig_object);
pctrie_iter_reset(&pages);
VM_OBJECT_WLOCK(new_object);
goto retry;
}
if (vm_page_none_valid(m) && entry->wired_count == 0) {
if (vm_page_iter_remove(&pages, m))
vm_page_free(m);
continue;
}
if (!vm_page_iter_rename(&pages, m, new_object, m->pindex -
offidxstart)) {
vm_page_xunbusy(m);
VM_OBJECT_WUNLOCK(new_object);
VM_OBJECT_WUNLOCK(orig_object);
vm_radix_wait();
pctrie_iter_reset(&pages);
VM_OBJECT_WLOCK(orig_object);
VM_OBJECT_WLOCK(new_object);
goto retry;
}
#if VM_NRESERVLEVEL > 0
vm_reserv_rename(m, new_object, orig_object, offidxstart);
#endif
}
swap_pager_copy(orig_object, new_object, offidxstart, 0);
vm_page_iter_init(&pages, new_object);
VM_RADIX_FOREACH(m, &pages)
vm_page_xunbusy(m);
vm_object_clear_flag(orig_object, OBJ_SPLIT);
VM_OBJECT_WUNLOCK(orig_object);
VM_OBJECT_WUNLOCK(new_object);
entry->object.vm_object = new_object;
entry->offset = 0LL;
vm_object_deallocate(orig_object);
VM_OBJECT_WLOCK(new_object);
}
static vm_page_t
vm_object_collapse_scan_wait(struct pctrie_iter *pages, vm_object_t object,
vm_page_t p)
{
vm_object_t backing_object;
VM_OBJECT_ASSERT_WLOCKED(object);
backing_object = object->backing_object;
VM_OBJECT_ASSERT_WLOCKED(backing_object);
KASSERT(p == NULL || p->object == object || p->object == backing_object,
("invalid ownership %p %p %p", p, object, backing_object));
if (p == NULL) {
VM_OBJECT_WUNLOCK(object);
VM_OBJECT_WUNLOCK(backing_object);
vm_radix_wait();
VM_OBJECT_WLOCK(object);
} else if (p->object == object) {
VM_OBJECT_WUNLOCK(backing_object);
if (vm_page_busy_sleep(p, "vmocol", 0))
VM_OBJECT_WLOCK(object);
} else {
VM_OBJECT_WUNLOCK(object);
if (!vm_page_busy_sleep(p, "vmocol", 0))
VM_OBJECT_WUNLOCK(backing_object);
VM_OBJECT_WLOCK(object);
}
VM_OBJECT_WLOCK(backing_object);
vm_page_iter_init(pages, backing_object);
return (vm_radix_iter_lookup_ge(pages, 0));
}
static void
vm_object_collapse_scan(vm_object_t object)
{
struct pctrie_iter pages;
vm_object_t backing_object;
vm_page_t next, p, pp;
vm_pindex_t backing_offset_index, new_pindex;
VM_OBJECT_ASSERT_WLOCKED(object);
VM_OBJECT_ASSERT_WLOCKED(object->backing_object);
backing_object = object->backing_object;
backing_offset_index = OFF_TO_IDX(object->backing_object_offset);
vm_page_iter_init(&pages, backing_object);
for (p = vm_radix_iter_lookup_ge(&pages, 0); p != NULL; p = next) {
if (vm_page_tryxbusy(p) == 0) {
next = vm_object_collapse_scan_wait(&pages, object, p);
continue;
}
KASSERT(object->backing_object == backing_object,
("vm_object_collapse_scan: backing object mismatch %p != %p",
object->backing_object, backing_object));
KASSERT(p->object == backing_object,
("vm_object_collapse_scan: object mismatch %p != %p",
p->object, backing_object));
if (p->pindex < backing_offset_index || object->size <=
(new_pindex = p->pindex - backing_offset_index)) {
vm_pager_freespace(backing_object, p->pindex, 1);
KASSERT(!pmap_page_is_mapped(p),
("freeing mapped page %p", p));
if (vm_page_iter_remove(&pages, p))
vm_page_free(p);
next = vm_radix_iter_step(&pages);
continue;
}
if (!vm_page_all_valid(p)) {
KASSERT(!pmap_page_is_mapped(p),
("freeing mapped page %p", p));
if (vm_page_iter_remove(&pages, p))
vm_page_free(p);
next = vm_radix_iter_step(&pages);
continue;
}
pp = vm_page_lookup(object, new_pindex);
if (pp != NULL && vm_page_tryxbusy(pp) == 0) {
vm_page_xunbusy(p);
next = vm_object_collapse_scan_wait(&pages, object, pp);
continue;
}
if (pp != NULL && vm_page_none_valid(pp)) {
if (vm_page_remove(pp))
vm_page_free(pp);
pp = NULL;
}
if (pp != NULL || vm_pager_has_page(object, new_pindex, NULL,
NULL)) {
vm_pager_freespace(backing_object, p->pindex, 1);
KASSERT(!pmap_page_is_mapped(p),
("freeing mapped page %p", p));
if (pp != NULL)
vm_page_xunbusy(pp);
if (vm_page_iter_remove(&pages, p))
vm_page_free(p);
next = vm_radix_iter_step(&pages);
continue;
}
if (!vm_page_iter_rename(&pages, p, object, new_pindex)) {
vm_page_xunbusy(p);
next = vm_object_collapse_scan_wait(&pages, object,
NULL);
continue;
}
vm_pager_freespace(backing_object, new_pindex +
backing_offset_index, 1);
#if VM_NRESERVLEVEL > 0
vm_reserv_rename(p, object, backing_object,
backing_offset_index);
#endif
vm_page_xunbusy(p);
next = vm_radix_iter_step(&pages);
}
return;
}
void
vm_object_collapse(vm_object_t object)
{
vm_object_t backing_object, new_backing_object;
VM_OBJECT_ASSERT_WLOCKED(object);
while (TRUE) {
KASSERT((object->flags & (OBJ_DEAD | OBJ_ANON)) == OBJ_ANON,
("collapsing invalid object"));
backing_object = vm_object_backing_collapse_wait(object);
if (backing_object == NULL)
return;
KASSERT(object->ref_count > 0 &&
object->ref_count > atomic_load_int(&object->shadow_count),
("collapse with invalid ref %d or shadow %d count.",
object->ref_count, atomic_load_int(&object->shadow_count)));
KASSERT((backing_object->flags &
(OBJ_COLLAPSING | OBJ_DEAD)) == 0,
("vm_object_collapse: Backing object already collapsing."));
KASSERT((object->flags & (OBJ_COLLAPSING | OBJ_DEAD)) == 0,
("vm_object_collapse: object is already collapsing."));
if (backing_object->ref_count == 1) {
KASSERT(atomic_load_int(&backing_object->shadow_count)
== 1,
("vm_object_collapse: shadow_count: %d",
atomic_load_int(&backing_object->shadow_count)));
vm_object_pip_add(object, 1);
vm_object_set_flag(object, OBJ_COLLAPSING);
vm_object_pip_add(backing_object, 1);
vm_object_set_flag(backing_object, OBJ_DEAD);
vm_object_collapse_scan(object);
swap_pager_copy(backing_object, object,
OFF_TO_IDX(object->backing_object_offset), TRUE);
vm_object_clear_flag(object, OBJ_COLLAPSING);
vm_object_backing_transfer(object, backing_object);
object->backing_object_offset +=
backing_object->backing_object_offset;
VM_OBJECT_WUNLOCK(object);
vm_object_pip_wakeup(object);
KASSERT(backing_object->ref_count == 1, (
"backing_object %p was somehow re-referenced during collapse!",
backing_object));
vm_object_pip_wakeup(backing_object);
(void)refcount_release(&backing_object->ref_count);
umtx_shm_object_terminated(backing_object);
vm_object_terminate(backing_object);
counter_u64_add(object_collapses, 1);
VM_OBJECT_WLOCK(object);
} else {
if (!swap_pager_scan_all_shadowed(object)) {
VM_OBJECT_WUNLOCK(backing_object);
break;
}
vm_object_backing_remove_locked(object);
new_backing_object = backing_object->backing_object;
if (new_backing_object != NULL) {
vm_object_backing_insert_ref(object,
new_backing_object);
object->backing_object_offset +=
backing_object->backing_object_offset;
}
(void)refcount_release(&backing_object->ref_count);
KASSERT(backing_object->ref_count >= 1, (
"backing_object %p was somehow dereferenced during collapse!",
backing_object));
VM_OBJECT_WUNLOCK(backing_object);
counter_u64_add(object_bypasses, 1);
}
}
}
void
vm_object_page_remove(vm_object_t object, vm_pindex_t start, vm_pindex_t end,
int options)
{
struct pctrie_iter pages;
vm_page_t p;
VM_OBJECT_ASSERT_WLOCKED(object);
KASSERT((object->flags & OBJ_UNMANAGED) == 0 ||
(options & (OBJPR_CLEANONLY | OBJPR_NOTMAPPED)) == OBJPR_NOTMAPPED,
("vm_object_page_remove: illegal options for object %p", object));
if (object->resident_page_count == 0)
return;
vm_object_pip_add(object, 1);
vm_page_iter_limit_init(&pages, object, end);
again:
KASSERT(pctrie_iter_is_reset(&pages),
("%s: pctrie_iter not reset for retry", __func__));
for (p = vm_radix_iter_lookup_ge(&pages, start); p != NULL;
p = vm_radix_iter_step(&pages)) {
if ((options & OBJPR_VALIDONLY) != 0 && vm_page_none_valid(p))
continue;
if (vm_page_tryxbusy(p) == 0) {
if (vm_page_busy_sleep(p, "vmopar", 0))
VM_OBJECT_WLOCK(object);
pctrie_iter_reset(&pages);
goto again;
}
if ((options & OBJPR_VALIDONLY) != 0 && vm_page_none_valid(p)) {
vm_page_xunbusy(p);
continue;
}
if (vm_page_wired(p)) {
wired:
if ((options & OBJPR_NOTMAPPED) == 0 &&
object->ref_count != 0)
pmap_remove_all(p);
if ((options & OBJPR_CLEANONLY) == 0) {
vm_page_invalid(p);
vm_page_undirty(p);
}
vm_page_xunbusy(p);
continue;
}
KASSERT((p->flags & PG_FICTITIOUS) == 0,
("vm_object_page_remove: page %p is fictitious", p));
if ((options & OBJPR_CLEANONLY) != 0 &&
!vm_page_none_valid(p)) {
if ((options & OBJPR_NOTMAPPED) == 0 &&
object->ref_count != 0 &&
!vm_page_try_remove_write(p))
goto wired;
if (p->dirty != 0) {
vm_page_xunbusy(p);
continue;
}
}
if ((options & OBJPR_NOTMAPPED) == 0 &&
object->ref_count != 0 && !vm_page_try_remove_all(p))
goto wired;
vm_page_iter_free(&pages, p);
}
vm_object_pip_wakeup(object);
vm_pager_freespace(object, start, (end == 0 ? object->size : end) -
start);
}
void
vm_object_page_noreuse(vm_object_t object, vm_pindex_t start, vm_pindex_t end)
{
struct pctrie_iter pages;
vm_page_t p;
VM_OBJECT_ASSERT_LOCKED(object);
KASSERT((object->flags & (OBJ_FICTITIOUS | OBJ_UNMANAGED)) == 0,
("vm_object_page_noreuse: illegal object %p", object));
if (object->resident_page_count == 0)
return;
vm_page_iter_limit_init(&pages, object, end);
VM_RADIX_FOREACH_FROM(p, &pages, start)
vm_page_deactivate_noreuse(p);
}
boolean_t
vm_object_populate(vm_object_t object, vm_pindex_t start, vm_pindex_t end)
{
struct pctrie_iter pages;
vm_page_t m;
vm_pindex_t pindex;
int rv;
vm_page_iter_init(&pages, object);
VM_OBJECT_ASSERT_WLOCKED(object);
for (pindex = start; pindex < end; pindex++) {
rv = vm_page_grab_valid_iter(&m, object, pindex,
VM_ALLOC_NORMAL, &pages);
if (rv != VM_PAGER_OK)
break;
}
if (pindex > start) {
pages.limit = pindex;
VM_RADIX_FORALL_FROM(m, &pages, start)
vm_page_xunbusy(m);
}
return (pindex == end);
}
boolean_t
vm_object_coalesce(vm_object_t prev_object, vm_ooffset_t prev_offset,
vm_size_t prev_size, vm_size_t next_size, boolean_t reserved)
{
vm_pindex_t next_pindex;
if (prev_object == NULL)
return (TRUE);
if ((prev_object->flags & OBJ_ANON) == 0)
return (FALSE);
VM_OBJECT_WLOCK(prev_object);
vm_object_collapse(prev_object);
if (prev_object->backing_object != NULL) {
VM_OBJECT_WUNLOCK(prev_object);
return (FALSE);
}
prev_size >>= PAGE_SHIFT;
next_size >>= PAGE_SHIFT;
next_pindex = OFF_TO_IDX(prev_offset) + prev_size;
if (prev_object->ref_count > 1 &&
prev_object->size != next_pindex &&
(prev_object->flags & OBJ_ONEMAPPING) == 0) {
VM_OBJECT_WUNLOCK(prev_object);
return (FALSE);
}
if (prev_object->cred != NULL) {
if (!reserved && !swap_reserve_by_cred(ptoa(next_size),
prev_object->cred)) {
VM_OBJECT_WUNLOCK(prev_object);
return (FALSE);
}
prev_object->charge += ptoa(next_size);
}
if (next_pindex < prev_object->size) {
vm_object_page_remove(prev_object, next_pindex, next_pindex +
next_size, 0);
#if 0
if (prev_object->cred != NULL) {
KASSERT(prev_object->charge >=
ptoa(prev_object->size - next_pindex),
("object %p overcharged 1 %jx %jx", prev_object,
(uintmax_t)next_pindex, (uintmax_t)next_size));
prev_object->charge -= ptoa(prev_object->size -
next_pindex);
}
#endif
}
if (next_pindex + next_size > prev_object->size)
prev_object->size = next_pindex + next_size;
VM_OBJECT_WUNLOCK(prev_object);
return (TRUE);
}
void
vm_object_prepare_buf_pages(vm_object_t object, vm_page_t *ma_dst, int count,
int *rbehind, int *rahead, vm_page_t *ma_src)
{
struct pctrie_iter pages;
vm_pindex_t pindex;
vm_page_t m, mpred, msucc;
vm_page_iter_init(&pages, object);
VM_OBJECT_ASSERT_LOCKED(object);
if (*rbehind != 0) {
m = ma_src[0];
pindex = m->pindex;
mpred = vm_radix_iter_lookup_lt(&pages, pindex);
*rbehind = MIN(*rbehind,
pindex - (mpred != NULL ? mpred->pindex + 1 : 0));
for (int i = 0; i < *rbehind; i++) {
m = vm_page_alloc_iter(object, pindex - i - 1,
VM_ALLOC_NORMAL, &pages);
if (m == NULL) {
for (int j = 0; j < i; j++)
ma_dst[j] = ma_dst[j + *rbehind - i];
*rbehind = i;
*rahead = 0;
break;
}
ma_dst[*rbehind - i - 1] = m;
}
}
for (int i = 0; i < count; i++)
ma_dst[*rbehind + i] = ma_src[i];
if (*rahead != 0) {
m = ma_src[count - 1];
pindex = m->pindex + 1;
msucc = vm_radix_iter_lookup_ge(&pages, pindex);
*rahead = MIN(*rahead,
(msucc != NULL ? msucc->pindex : object->size) - pindex);
for (int i = 0; i < *rahead; i++) {
m = vm_page_alloc_iter(object, pindex + i,
VM_ALLOC_NORMAL, &pages);
if (m == NULL) {
*rahead = i;
break;
}
ma_dst[*rbehind + count + i] = m;
}
}
}
void
vm_object_set_writeable_dirty_(vm_object_t object)
{
atomic_add_int(&object->generation, 1);
}
bool
vm_object_mightbedirty_(vm_object_t object)
{
return (object->generation != object->cleangeneration);
}
void
vm_object_unwire(vm_object_t object, vm_ooffset_t offset, vm_size_t length,
uint8_t queue)
{
struct pctrie_iter pages;
vm_object_t tobject, t1object;
vm_page_t m, tm;
vm_pindex_t end_pindex, pindex, tpindex;
int depth, locked_depth;
KASSERT((offset & PAGE_MASK) == 0,
("vm_object_unwire: offset is not page aligned"));
KASSERT((length & PAGE_MASK) == 0,
("vm_object_unwire: length is not a multiple of PAGE_SIZE"));
if ((object->flags & OBJ_FICTITIOUS) != 0)
return;
pindex = OFF_TO_IDX(offset);
end_pindex = pindex + atop(length);
vm_page_iter_init(&pages, object);
again:
locked_depth = 1;
VM_OBJECT_RLOCK(object);
m = vm_radix_iter_lookup_ge(&pages, pindex);
while (pindex < end_pindex) {
if (m == NULL || pindex < m->pindex) {
tobject = object;
tpindex = pindex;
depth = 0;
do {
tpindex +=
OFF_TO_IDX(tobject->backing_object_offset);
tobject = tobject->backing_object;
KASSERT(tobject != NULL,
("vm_object_unwire: missing page"));
if ((tobject->flags & OBJ_FICTITIOUS) != 0)
goto next_page;
depth++;
if (depth == locked_depth) {
locked_depth++;
VM_OBJECT_RLOCK(tobject);
}
} while ((tm = vm_page_lookup(tobject, tpindex)) ==
NULL);
} else {
tm = m;
m = vm_radix_iter_step(&pages);
}
if (vm_page_trysbusy(tm) == 0) {
for (tobject = object; locked_depth >= 1;
locked_depth--) {
t1object = tobject->backing_object;
if (tm->object != tobject)
VM_OBJECT_RUNLOCK(tobject);
tobject = t1object;
}
tobject = tm->object;
if (!vm_page_busy_sleep(tm, "unwbo",
VM_ALLOC_IGN_SBUSY))
VM_OBJECT_RUNLOCK(tobject);
pctrie_iter_reset(&pages);
goto again;
}
vm_page_unwire(tm, queue);
vm_page_sunbusy(tm);
next_page:
pindex++;
}
for (tobject = object; locked_depth >= 1; locked_depth--) {
t1object = tobject->backing_object;
VM_OBJECT_RUNLOCK(tobject);
tobject = t1object;
}
}
struct vnode *
vm_object_vnode(vm_object_t object)
{
struct vnode *vp;
VM_OBJECT_ASSERT_LOCKED(object);
vm_pager_getvp(object, &vp, NULL);
return (vp);
}
void
vm_object_busy(vm_object_t obj)
{
VM_OBJECT_ASSERT_LOCKED(obj);
blockcount_acquire(&obj->busy, 1);
atomic_thread_fence_acq_rel();
}
void
vm_object_unbusy(vm_object_t obj)
{
blockcount_release(&obj->busy, 1);
}
void
vm_object_busy_wait(vm_object_t obj, const char *wmesg)
{
VM_OBJECT_ASSERT_UNLOCKED(obj);
(void)blockcount_sleep(&obj->busy, NULL, wmesg, PVM);
}
bool
vm_object_is_active(vm_object_t obj)
{
return (obj->ref_count > atomic_load_int(&obj->shadow_count));
}
static int
vm_object_list_handler(struct sysctl_req *req, bool swap_only)
{
struct pctrie_iter pages;
struct kinfo_vmobject *kvo;
char *fullpath, *freepath;
struct vnode *vp;
struct vattr va;
vm_object_t obj;
vm_page_t m;
u_long sp;
int count, error;
key_t key;
unsigned short seq;
bool want_path;
if (req->oldptr == NULL) {
mtx_lock(&vm_object_list_mtx);
count = 0;
TAILQ_FOREACH(obj, &vm_object_list, object_list) {
if (obj->type == OBJT_DEAD)
continue;
count++;
}
mtx_unlock(&vm_object_list_mtx);
return (SYSCTL_OUT(req, NULL, sizeof(struct kinfo_vmobject) *
count * 11 / 10));
}
want_path = !(swap_only || jailed(curthread->td_ucred));
kvo = malloc(sizeof(*kvo), M_TEMP, M_WAITOK | M_ZERO);
error = 0;
mtx_lock(&vm_object_list_mtx);
TAILQ_FOREACH(obj, &vm_object_list, object_list) {
if (obj->type == OBJT_DEAD ||
(swap_only && (obj->flags & (OBJ_ANON | OBJ_SWAP)) == 0))
continue;
VM_OBJECT_RLOCK(obj);
if (obj->type == OBJT_DEAD ||
(swap_only && (obj->flags & (OBJ_ANON | OBJ_SWAP)) == 0)) {
VM_OBJECT_RUNLOCK(obj);
continue;
}
mtx_unlock(&vm_object_list_mtx);
kvo->kvo_size = ptoa(obj->size);
kvo->kvo_resident = obj->resident_page_count;
kvo->kvo_ref_count = obj->ref_count;
kvo->kvo_shadow_count = atomic_load_int(&obj->shadow_count);
kvo->kvo_memattr = obj->memattr;
kvo->kvo_active = 0;
kvo->kvo_inactive = 0;
kvo->kvo_laundry = 0;
kvo->kvo_flags = 0;
if (!swap_only) {
vm_page_iter_init(&pages, obj);
VM_RADIX_FOREACH(m, &pages) {
if (vm_page_active(m))
kvo->kvo_active++;
else if (vm_page_inactive(m))
kvo->kvo_inactive++;
else if (vm_page_in_laundry(m))
kvo->kvo_laundry++;
}
}
kvo->kvo_vn_fileid = 0;
kvo->kvo_vn_fsid = 0;
kvo->kvo_vn_fsid_freebsd11 = 0;
freepath = NULL;
fullpath = "";
vp = NULL;
kvo->kvo_type = vm_object_kvme_type(obj, want_path ? &vp :
NULL);
if (vp != NULL) {
vref(vp);
} else if ((obj->flags & OBJ_ANON) != 0) {
MPASS(kvo->kvo_type == KVME_TYPE_SWAP);
kvo->kvo_me = (uintptr_t)obj;
kvo->kvo_backing_obj = (uintptr_t)obj->backing_object;
sp = swap_pager_swapped_pages(obj);
kvo->kvo_swapped = sp > UINT32_MAX ? UINT32_MAX : sp;
}
if (obj->type == OBJT_DEVICE || obj->type == OBJT_MGTDEVICE) {
cdev_pager_get_path(obj, kvo->kvo_path,
sizeof(kvo->kvo_path));
}
VM_OBJECT_RUNLOCK(obj);
if ((obj->flags & OBJ_SYSVSHM) != 0) {
kvo->kvo_flags |= KVMO_FLAG_SYSVSHM;
shmobjinfo(obj, &key, &seq);
kvo->kvo_vn_fileid = key;
kvo->kvo_vn_fsid_freebsd11 = seq;
}
if ((obj->flags & OBJ_POSIXSHM) != 0) {
kvo->kvo_flags |= KVMO_FLAG_POSIXSHM;
shm_get_path(obj, kvo->kvo_path,
sizeof(kvo->kvo_path));
}
if (vp != NULL) {
vn_fullpath(vp, &fullpath, &freepath);
vn_lock(vp, LK_SHARED | LK_RETRY);
if (VOP_GETATTR(vp, &va, curthread->td_ucred) == 0) {
kvo->kvo_vn_fileid = va.va_fileid;
kvo->kvo_vn_fsid = va.va_fsid;
kvo->kvo_vn_fsid_freebsd11 = va.va_fsid;
}
vput(vp);
strlcpy(kvo->kvo_path, fullpath, sizeof(kvo->kvo_path));
free(freepath, M_TEMP);
}
kvo->kvo_structsize = offsetof(struct kinfo_vmobject, kvo_path)
+ strlen(kvo->kvo_path) + 1;
kvo->kvo_structsize = roundup(kvo->kvo_structsize,
sizeof(uint64_t));
error = SYSCTL_OUT(req, kvo, kvo->kvo_structsize);
maybe_yield();
mtx_lock(&vm_object_list_mtx);
if (error)
break;
}
mtx_unlock(&vm_object_list_mtx);
free(kvo, M_TEMP);
return (error);
}
static int
sysctl_vm_object_list(SYSCTL_HANDLER_ARGS)
{
return (vm_object_list_handler(req, false));
}
SYSCTL_PROC(_vm, OID_AUTO, objects, CTLTYPE_STRUCT | CTLFLAG_RW | CTLFLAG_SKIP |
CTLFLAG_MPSAFE, NULL, 0, sysctl_vm_object_list, "S,kinfo_vmobject",
"List of VM objects");
static int
sysctl_vm_object_list_swap(SYSCTL_HANDLER_ARGS)
{
return (vm_object_list_handler(req, true));
}
SYSCTL_PROC(_vm, OID_AUTO, swap_objects,
CTLTYPE_STRUCT | CTLFLAG_RW | CTLFLAG_SKIP | CTLFLAG_MPSAFE, NULL, 0,
sysctl_vm_object_list_swap, "S,kinfo_vmobject",
"List of swap VM objects");
#include "opt_ddb.h"
#ifdef DDB
#include <sys/kernel.h>
#include <sys/cons.h>
#include <ddb/ddb.h>
static int
_vm_object_in_map(vm_map_t map, vm_object_t object, vm_map_entry_t entry)
{
vm_map_t tmpm;
vm_map_entry_t tmpe;
vm_object_t obj;
if (map == 0)
return 0;
if (entry == 0) {
VM_MAP_ENTRY_FOREACH(tmpe, map) {
if (_vm_object_in_map(map, object, tmpe)) {
return 1;
}
}
} else if (entry->eflags & MAP_ENTRY_IS_SUB_MAP) {
tmpm = entry->object.sub_map;
VM_MAP_ENTRY_FOREACH(tmpe, tmpm) {
if (_vm_object_in_map(tmpm, object, tmpe)) {
return 1;
}
}
} else if ((obj = entry->object.vm_object) != NULL) {
for (; obj; obj = obj->backing_object)
if (obj == object) {
return 1;
}
}
return 0;
}
static int
vm_object_in_map(vm_object_t object)
{
struct proc *p;
FOREACH_PROC_IN_SYSTEM(p) {
if (!p->p_vmspace )
continue;
if (_vm_object_in_map(&p->p_vmspace->vm_map, object, 0)) {
return 1;
}
}
if (_vm_object_in_map(kernel_map, object, 0))
return 1;
return 0;
}
DB_SHOW_COMMAND_FLAGS(vmochk, vm_object_check, DB_CMD_MEMSAFE)
{
vm_object_t object;
TAILQ_FOREACH(object, &vm_object_list, object_list) {
if ((object->flags & OBJ_ANON) != 0) {
if (object->ref_count == 0) {
db_printf(
"vmochk: internal obj has zero ref count: %lu\n",
(u_long)object->size);
}
if (!vm_object_in_map(object)) {
db_printf(
"vmochk: internal obj is not in a map: "
"ref: %d, size: %lu: 0x%lx, backing_object: %p\n",
object->ref_count, (u_long)object->size,
(u_long)object->size,
(void *)object->backing_object);
}
}
if (db_pager_quit)
return;
}
}
DB_SHOW_COMMAND(object, vm_object_print_static)
{
struct pctrie_iter pages;
vm_object_t object = (vm_object_t)addr;
boolean_t full = have_addr;
vm_page_t p;
#define count was_count
int count;
if (object == NULL)
return;
db_iprintf("Object %p: type=%d, size=0x%jx, res=%d, ref=%d, flags=0x%x",
object, (int)object->type, (uintmax_t)object->size,
object->resident_page_count, object->ref_count, object->flags);
db_iprintf(" ruid %d charge %jx\n",
object->cred ? object->cred->cr_ruid : -1,
(uintmax_t)object->charge);
db_iprintf(" sref=%d, backing_object(%d)=(%p)+0x%jx\n",
atomic_load_int(&object->shadow_count),
object->backing_object ? object->backing_object->ref_count : 0,
object->backing_object, (uintmax_t)object->backing_object_offset);
if (!full)
return;
db_indent += 2;
count = 0;
vm_page_iter_init(&pages, object);
VM_RADIX_FOREACH(p, &pages) {
if (count == 0)
db_iprintf("memory:=");
else if (count == 6) {
db_printf("\n");
db_iprintf(" ...");
count = 0;
} else
db_printf(",");
count++;
db_printf("(off=0x%jx,page=0x%jx)",
(uintmax_t)p->pindex, (uintmax_t)VM_PAGE_TO_PHYS(p));
if (db_pager_quit)
break;
}
if (count != 0)
db_printf("\n");
db_indent -= 2;
}
#undef count
void
vm_object_print(
long addr,
boolean_t have_addr,
long count,
char *modif)
{
vm_object_print_static(addr, have_addr, count, modif);
}
DB_SHOW_COMMAND_FLAGS(vmopag, vm_object_print_pages, DB_CMD_MEMSAFE)
{
struct pctrie_iter pages;
vm_object_t object;
vm_page_t m, start_m;
int rcount;
TAILQ_FOREACH(object, &vm_object_list, object_list) {
db_printf("new object: %p\n", (void *)object);
if (db_pager_quit)
return;
start_m = NULL;
vm_page_iter_init(&pages, object);
VM_RADIX_FOREACH(m, &pages) {
if (start_m == NULL) {
start_m = m;
rcount = 0;
} else if (start_m->pindex + rcount != m->pindex ||
VM_PAGE_TO_PHYS(start_m) + ptoa(rcount) !=
VM_PAGE_TO_PHYS(m)) {
db_printf(" index(%ld)run(%d)pa(0x%lx)\n",
(long)start_m->pindex, rcount,
(long)VM_PAGE_TO_PHYS(start_m));
if (db_pager_quit)
return;
start_m = m;
rcount = 0;
}
rcount++;
}
if (start_m != NULL) {
db_printf(" index(%ld)run(%d)pa(0x%lx)\n",
(long)start_m->pindex, rcount,
(long)VM_PAGE_TO_PHYS(start_m));
if (db_pager_quit)
return;
}
}
}
#endif