/*-
 * Copyright (c) 2010 Isilon Systems, Inc.
 * Copyright (c) 2010 iX Systems, Inc.
 * Copyright (c) 2010 Panasas, Inc.
 * Copyright (c) 2013-2017 Mellanox Technologies, Ltd.
 * Copyright (c) 2015 François Tigeot
 * Copyright (c) 2015 Matthew Dillon <dillon@backplane.com>
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice unmodified, this list of conditions, and the following
 *    disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
 * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
 * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
 * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 */
#ifndef _LINUXKPI_LINUX_MM_H_
#define _LINUXKPI_LINUX_MM_H_

#include <linux/spinlock.h>
#include <linux/gfp.h>
#include <linux/kernel.h>
#include <linux/mm_types.h>
#include <linux/mmzone.h>
#include <linux/pfn.h>
#include <linux/list.h>
#include <linux/mmap_lock.h>
#include <linux/overflow.h>
#include <linux/shrinker.h>
#include <linux/page.h>

#include <asm/pgtable.h>

#define PAGE_ALIGN(x)   ALIGN(x, PAGE_SIZE)

/*
 * Make sure our LinuxKPI-defined virtual memory flags don't conflict
 * with the ones defined by FreeBSD: all of FreeBSD's VM_PROT_* bits
 * must fit below bit 8, where the LinuxKPI-private flags begin.
 */
CTASSERT((VM_PROT_ALL & -(1 << 8)) == 0);

#define VM_READ                 VM_PROT_READ
#define VM_WRITE                VM_PROT_WRITE
#define VM_EXEC                 VM_PROT_EXECUTE

#define VM_ACCESS_FLAGS         (VM_READ | VM_WRITE | VM_EXEC)

#define VM_PFNINTERNAL          (1 << 8)        /* FreeBSD private flag to vm_insert_pfn() */
#define VM_MIXEDMAP             (1 << 9)
#define VM_NORESERVE            (1 << 10)
#define VM_PFNMAP               (1 << 11)
#define VM_IO                   (1 << 12)
#define VM_MAYWRITE             (1 << 13)
#define VM_DONTCOPY             (1 << 14)
#define VM_DONTEXPAND           (1 << 15)
#define VM_DONTDUMP             (1 << 16)
#define VM_SHARED               (1 << 17)

#define VMA_MAX_PREFAULT_RECORD 1

#define FOLL_WRITE              (1 << 0)
#define FOLL_FORCE              (1 << 1)

#define VM_FAULT_OOM            (1 << 0)
#define VM_FAULT_SIGBUS         (1 << 1)
#define VM_FAULT_MAJOR          (1 << 2)
#define VM_FAULT_WRITE          (1 << 3)
#define VM_FAULT_HWPOISON       (1 << 4)
#define VM_FAULT_HWPOISON_LARGE (1 << 5)
#define VM_FAULT_SIGSEGV        (1 << 6)
#define VM_FAULT_NOPAGE         (1 << 7)
#define VM_FAULT_LOCKED         (1 << 8)
#define VM_FAULT_RETRY          (1 << 9)
#define VM_FAULT_FALLBACK       (1 << 10)

#define VM_FAULT_ERROR (VM_FAULT_OOM | VM_FAULT_SIGBUS | VM_FAULT_SIGSEGV | \
        VM_FAULT_HWPOISON | VM_FAULT_HWPOISON_LARGE | VM_FAULT_FALLBACK)

#define FAULT_FLAG_WRITE        (1 << 0)
#define FAULT_FLAG_MKWRITE      (1 << 1)
#define FAULT_FLAG_ALLOW_RETRY  (1 << 2)
#define FAULT_FLAG_RETRY_NOWAIT (1 << 3)
#define FAULT_FLAG_KILLABLE     (1 << 4)
#define FAULT_FLAG_TRIED        (1 << 5)
#define FAULT_FLAG_USER         (1 << 6)
#define FAULT_FLAG_REMOTE       (1 << 7)
#define FAULT_FLAG_INSTRUCTION  (1 << 8)

#define fault_flag_allow_retry_first(flags) \
        (((flags) & (FAULT_FLAG_ALLOW_RETRY | FAULT_FLAG_TRIED)) == FAULT_FLAG_ALLOW_RETRY)

typedef int (*pte_fn_t)(linux_pte_t *, unsigned long addr, void *data);

struct vm_area_struct {
        vm_offset_t vm_start;
        vm_offset_t vm_end;
        vm_offset_t vm_pgoff;
        pgprot_t vm_page_prot;
        unsigned long vm_flags;
        struct mm_struct *vm_mm;
        void   *vm_private_data;
        const struct vm_operations_struct *vm_ops;
        struct linux_file *vm_file;

        /* internal operation */
        vm_paddr_t vm_pfn;              /* PFN for memory map */
        vm_size_t vm_len;               /* length for memory map */
        vm_pindex_t vm_pfn_first;
        int     vm_pfn_count;
        int    *vm_pfn_pcount;
        vm_object_t vm_obj;
        vm_map_t vm_cached_map;
        TAILQ_ENTRY(vm_area_struct) vm_entry;
};

struct vm_fault {
        unsigned int flags;
        pgoff_t pgoff;
        union {
                /* user-space address */
                void *virtual_address;  /* < 4.11 */
                unsigned long address;  /* >= 4.11 */
        };
        struct page *page;
        struct vm_area_struct *vma;
};

struct vm_operations_struct {
        void    (*open) (struct vm_area_struct *);
        void    (*close) (struct vm_area_struct *);
        int     (*fault) (struct vm_fault *);
        int     (*access) (struct vm_area_struct *, unsigned long, void *, int, int);
};

struct sysinfo {
        uint64_t totalram;      /* Total usable main memory size */
        uint64_t freeram;       /* Available memory size */
        uint64_t totalhigh;     /* Total high memory size */
        uint64_t freehigh;      /* Available high memory size */
        uint32_t mem_unit;      /* Memory unit size in bytes */
};

static inline struct page *
virt_to_head_page(const void *p)
{

        return (virt_to_page(p));
}

static inline struct folio *
virt_to_folio(const void *p)
{
        struct page *page = virt_to_page(p);

        return (page_folio(page));
}

/*
 * Compute the base-2 logarithm of the power-of-two page count, rounded
 * up, needed to back "size" bytes.
 */
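/*
 * Illustrative values, assuming 4 KiB pages (PAGE_SHIFT == 12):
 * get_order(1) == 0, get_order(PAGE_SIZE + 1) == 1 and
 * get_order(8 * PAGE_SIZE) == 3.
 */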
static inline int
get_order(unsigned long size)
{
        int order;

        size = (size - 1) >> PAGE_SHIFT;
        order = 0;
        while (size) {
                order++;
                size >>= 1;
        }
        return (order);
}

/*
 * Resolve a page into a virtual address:
 *
 * NOTE: This function only works for pages allocated by the kernel.
 */
void *linux_page_address(const struct page *);
#define page_address(page) linux_page_address(page)

static inline void *
lowmem_page_address(struct page *page)
{
        return (page_address(page));
}

/*
 * This only works within a memory-map operation: the PFN range is
 * merely recorded in the VMA; the actual mapping is installed later
 * by the LinuxKPI mmap machinery.
 */
static inline int
io_remap_pfn_range(struct vm_area_struct *vma,
    unsigned long addr, unsigned long pfn, unsigned long size,
    vm_memattr_t prot)
{
        vma->vm_page_prot = prot;
        vma->vm_pfn = pfn;
        vma->vm_len = size;

        return (0);
}

vm_fault_t
lkpi_vmf_insert_pfn_prot_locked(struct vm_area_struct *vma, unsigned long addr,
    unsigned long pfn, pgprot_t prot);

static inline vm_fault_t
vmf_insert_pfn_prot(struct vm_area_struct *vma, unsigned long addr,
    unsigned long pfn, pgprot_t prot)
{
        vm_fault_t ret;

        VM_OBJECT_WLOCK(vma->vm_obj);
        ret = lkpi_vmf_insert_pfn_prot_locked(vma, addr, pfn, prot);
        VM_OBJECT_WUNLOCK(vma->vm_obj);

        return (ret);
}
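
/*
 * The macro below deliberately shadows the inline function above, so
 * any direct call to vmf_insert_pfn_prot() fails at compile time.  As
 * the assertion message says, this function is always called in a
 * loop; use lkpi_vmf_insert_pfn_prot_locked() instead and hold the VM
 * object lock across the whole loop.
 */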
#define vmf_insert_pfn_prot(...)        \
        _Static_assert(false,           \
"This function is always called in a loop. Consider using the locked version")

static inline int
apply_to_page_range(struct mm_struct *mm, unsigned long address,
    unsigned long size, pte_fn_t fn, void *data)
{
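        /* Stub: applying a callback to a PTE range is not supported. */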
        return (-ENOTSUP);
}

int zap_vma_ptes(struct vm_area_struct *vma, unsigned long address,
    unsigned long size);

int lkpi_remap_pfn_range(struct vm_area_struct *vma,
    unsigned long start_addr, unsigned long start_pfn, unsigned long size,
    pgprot_t prot);

static inline int
remap_pfn_range(struct vm_area_struct *vma, unsigned long addr,
    unsigned long pfn, unsigned long size, pgprot_t prot)
{
        return (lkpi_remap_pfn_range(vma, addr, pfn, size, prot));
}

static inline unsigned long
vma_pages(struct vm_area_struct *vma)
{
        return ((vma->vm_end - vma->vm_start) >> PAGE_SHIFT);
}

#define offset_in_page(off)     ((unsigned long)(off) & (PAGE_SIZE - 1))

static inline void
set_page_dirty(struct page *page)
{
        vm_page_dirty(page);
}

static inline void
mark_page_accessed(struct page *page)
{
        vm_page_reference(page);
}

static inline void
get_page(struct page *page)
{
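        /* Taking a reference on a page maps onto wiring it. */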
        vm_page_wire(page);
}

static inline void
put_page(struct page *page)
{
        /* `__free_page()` takes care of the refcounting (unwire). */
        __free_page(page);
}

static inline void
folio_get(struct folio *folio)
{
        get_page(&folio->page);
}

static inline void
folio_put(struct folio *folio)
{
        put_page(&folio->page);
}

/*
 * Linux uses the following "transparent" union so that `release_pages()`
 * accepts either a list of `struct page` or a list of `struct folio`.
 * This relies on the fact that a pointer to a `struct folio` can be cast
 * to a pointer to its leading `struct page` member.
 */
typedef union {
        struct page **pages;
        struct folio **folios;
} release_pages_arg __attribute__ ((__transparent_union__));

void linux_release_pages(release_pages_arg arg, int nr);
#define release_pages(arg, nr) linux_release_pages((arg), (nr))

extern long
lkpi_get_user_pages(unsigned long start, unsigned long nr_pages,
    unsigned int gup_flags, struct page **);
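
/*
 * Linux 6.5 removed the "vmas" output parameter from get_user_pages();
 * when building against an older LinuxKPI version the extra argument
 * is accepted here but ignored.
 */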
#if defined(LINUXKPI_VERSION) && LINUXKPI_VERSION >= 60500
#define get_user_pages(start, nr_pages, gup_flags, pages)       \
        lkpi_get_user_pages(start, nr_pages, gup_flags, pages)
#else
#define get_user_pages(start, nr_pages, gup_flags, pages, vmas) \
        lkpi_get_user_pages(start, nr_pages, gup_flags, pages)
#endif

#if defined(LINUXKPI_VERSION) && LINUXKPI_VERSION >= 60500
static inline long
pin_user_pages(unsigned long start, unsigned long nr_pages,
    unsigned int gup_flags, struct page **pages)
{
        return (get_user_pages(start, nr_pages, gup_flags, pages));
}
#else
static inline long
pin_user_pages(unsigned long start, unsigned long nr_pages,
    unsigned int gup_flags, struct page **pages,
    struct vm_area_struct **vmas)
{
        return (get_user_pages(start, nr_pages, gup_flags, pages, vmas));
}
#endif

extern int
__get_user_pages_fast(unsigned long start, int nr_pages, int write,
    struct page **);

static inline int
pin_user_pages_fast(unsigned long start, int nr_pages,
    unsigned int gup_flags, struct page **pages)
{
        return (__get_user_pages_fast(
            start, nr_pages, !!(gup_flags & FOLL_WRITE), pages));
}

extern long
get_user_pages_remote(struct task_struct *, struct mm_struct *,
    unsigned long start, unsigned long nr_pages,
    unsigned int gup_flags, struct page **,
    struct vm_area_struct **);

static inline long
pin_user_pages_remote(struct task_struct *task, struct mm_struct *mm,
    unsigned long start, unsigned long nr_pages,
    unsigned int gup_flags, struct page **pages,
    struct vm_area_struct **vmas)
{
        return (get_user_pages_remote(
            task, mm, start, nr_pages, gup_flags, pages, vmas));
}

#define unpin_user_page(page) put_page(page)
#define unpin_user_pages(pages, npages) release_pages(pages, npages)

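/* Note the argument order: FreeBSD's pmap_copy_page() takes (src, dst). */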
#define copy_highpage(to, from) pmap_copy_page(from, to)

static inline pgprot_t
vm_get_page_prot(unsigned long vm_flags)
{
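        /* VM_READ, VM_WRITE and VM_EXEC alias FreeBSD's VM_PROT_* bits. */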
        return (vm_flags & VM_PROT_ALL);
}

static inline void
vm_flags_set(struct vm_area_struct *vma, unsigned long flags)
{
        vma->vm_flags |= flags;
}

static inline void
vm_flags_clear(struct vm_area_struct *vma, unsigned long flags)
{
        vma->vm_flags &= ~flags;
}

static inline struct page *
vmalloc_to_page(const void *addr)
{
        vm_paddr_t paddr;

        paddr = pmap_kextract((vm_offset_t)addr);
        return (PHYS_TO_VM_PAGE(paddr));
}

static inline int
trylock_page(struct page *page)
{
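        /* The Linux page lock maps onto FreeBSD's exclusive busy state. */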
        return (vm_page_tryxbusy(page));
}

static inline void
unlock_page(struct page *page)
{

        vm_page_xunbusy(page);
}

extern int is_vmalloc_addr(const void *addr);
void si_meminfo(struct sysinfo *si);

static inline unsigned long
totalram_pages(void)
{
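        /* FreeBSD's "physmem" is the amount of physical memory in pages. */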
        return ((unsigned long)physmem);
}

#define unmap_mapping_range(...)        lkpi_unmap_mapping_range(__VA_ARGS__)
void lkpi_unmap_mapping_range(void *obj, loff_t const holebegin __unused,
    loff_t const holelen, int even_cows __unused);

#define PAGE_ALIGNED(p) __is_aligned(p, PAGE_SIZE)

void vma_set_file(struct vm_area_struct *vma, struct linux_file *file);

static inline void
might_alloc(gfp_t gfp_mask __unused)
{
}

#define is_cow_mapping(flags)   (false)

static inline bool
want_init_on_free(void)
{
        return (false);
}

static inline unsigned long
folio_pfn(struct folio *folio)
{
        return (page_to_pfn(&folio->page));
}

static inline long
folio_nr_pages(struct folio *folio)
{
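        /* LinuxKPI folios always consist of exactly one page. */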
        return (1);
}

static inline size_t
folio_size(struct folio *folio)
{
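        /* A single-page folio spans exactly PAGE_SIZE bytes. */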
        return (PAGE_SIZE);
}

static inline void
folio_mark_dirty(struct folio *folio)
{
        set_page_dirty(&folio->page);
}

static inline void *
folio_address(const struct folio *folio)
{
        return (page_address(&folio->page));
}

#endif                                  /* _LINUXKPI_LINUX_MM_H_ */