blob: 74ebb92b625ad35d39ca12cf22067d69a1796c22 [file] [log] [blame]
Matthew Wilcoxc94c2ac2015-09-08 14:58:40 -07001#ifndef _LINUX_DAX_H
2#define _LINUX_DAX_H
3
4#include <linux/fs.h>
5#include <linux/mm.h>
Jan Kara4f622932016-05-12 18:29:17 +02006#include <linux/radix-tree.h>
Matthew Wilcoxc94c2ac2015-09-08 14:58:40 -07007#include <asm/pgtable.h>
8
Christoph Hellwiga254e562016-09-19 11:24:49 +10009struct iomap_ops;
Dan Williams6568b082017-01-24 18:44:18 -080010struct dax_device;
11struct dax_operations {
12 /*
13 * direct_access: translate a device-relative
14 * logical-page-offset into an absolute physical pfn. Return the
15 * number of pages available for DAX at that pfn.
16 */
17 long (*direct_access)(struct dax_device *, pgoff_t, long,
18 void **, pfn_t *);
19};
Christoph Hellwiga254e562016-09-19 11:24:49 +100020
/*
 * DAX device helpers, defined outside this header.
 *
 * NOTE(review): the 'id' taken by dax_read_unlock() is presumably the value
 * returned by the matching dax_read_lock() call - confirm against the
 * implementation.
 */
int dax_read_lock(void);
void dax_read_unlock(int id);
struct dax_device *dax_get_by_host(const char *host);
Dan Williams7b6be842017-04-11 09:49:49 -070024
/*
 * We use the lowest available bit in an exceptional entry for locking, one
 * bit for the entry size (PMD) and two more to tell us if the entry is a huge
 * zero page (HZP) or an empty entry that is just used for locking. In total
 * four special bits.
 *
 * If the PMD bit isn't set the entry has size PAGE_SIZE, and if the HZP and
 * EMPTY bits aren't set the entry is a normal DAX entry with a filesystem
 * block allocation.
 */
/* Number of low bits below the sector payload (exceptional bits + 4 flags). */
#define RADIX_DAX_SHIFT	(RADIX_TREE_EXCEPTIONAL_SHIFT + 4)
/* Lock bit: lowest bit available above the exceptional-entry bits. */
#define RADIX_DAX_ENTRY_LOCK (1 << RADIX_TREE_EXCEPTIONAL_SHIFT)
/* Entry size bit: set for PMD-sized entries, clear for PAGE_SIZE entries. */
#define RADIX_DAX_PMD (1 << (RADIX_TREE_EXCEPTIONAL_SHIFT + 1))
/* Entry is a huge zero page. */
#define RADIX_DAX_HZP (1 << (RADIX_TREE_EXCEPTIONAL_SHIFT + 2))
/* Entry is empty and only used for locking. */
#define RADIX_DAX_EMPTY (1 << (RADIX_TREE_EXCEPTIONAL_SHIFT + 3))
Ross Zwislerfa28f722016-11-08 11:33:35 +110040
Ross Zwisler642261a2016-11-08 11:34:45 +110041static inline unsigned long dax_radix_sector(void *entry)
42{
43 return (unsigned long)entry >> RADIX_DAX_SHIFT;
44}
45
46static inline void *dax_radix_locked_entry(sector_t sector, unsigned long flags)
47{
48 return (void *)(RADIX_TREE_EXCEPTIONAL_ENTRY | flags |
49 ((unsigned long)sector << RADIX_DAX_SHIFT) |
50 RADIX_DAX_ENTRY_LOCK);
51}
Jan Karae8043152016-05-12 18:29:16 +020052
Ross Zwisler11c59c92016-11-08 11:32:46 +110053ssize_t dax_iomap_rw(struct kiocb *iocb, struct iov_iter *iter,
Christoph Hellwig8ff6daa2017-01-27 23:20:26 -080054 const struct iomap_ops *ops);
Dave Jiangc791ace2017-02-24 14:57:08 -080055int dax_iomap_fault(struct vm_fault *vmf, enum page_entry_size pe_size,
56 const struct iomap_ops *ops);
Jan Karaac401cc2016-05-12 18:29:18 +020057int dax_delete_mapping_entry(struct address_space *mapping, pgoff_t index);
Jan Karac6dcf522016-08-10 17:22:44 +020058int dax_invalidate_mapping_entry(struct address_space *mapping, pgoff_t index);
59int dax_invalidate_mapping_entry_sync(struct address_space *mapping,
60 pgoff_t index);
Jan Karaac401cc2016-05-12 18:29:18 +020061void dax_wake_mapping_entry_waiter(struct address_space *mapping,
Ross Zwisler63e95b52016-11-08 11:32:20 +110062 pgoff_t index, void *entry, bool wake_all);
Dan Williamsd1a5f2b42016-01-28 20:25:31 -080063
64#ifdef CONFIG_FS_DAX
65struct page *read_dax_sector(struct block_device *bdev, sector_t n);
Christoph Hellwig679c8bd2016-05-09 10:47:04 +020066int __dax_zero_page_range(struct block_device *bdev, sector_t sector,
67 unsigned int offset, unsigned int length);
Dan Williamsd1a5f2b42016-01-28 20:25:31 -080068#else
69static inline struct page *read_dax_sector(struct block_device *bdev,
70 sector_t n)
71{
72 return ERR_PTR(-ENXIO);
73}
Christoph Hellwig679c8bd2016-05-09 10:47:04 +020074static inline int __dax_zero_page_range(struct block_device *bdev,
75 sector_t sector, unsigned int offset, unsigned int length)
76{
77 return -ENXIO;
78}
Dan Williamsd1a5f2b42016-01-28 20:25:31 -080079#endif
80
/*
 * dax_radix_order - page order covered by a radix tree entry.
 * @entry: entry value, inspected as an unsigned long
 *
 * With CONFIG_FS_DAX_PMD, an entry that has RADIX_DAX_PMD set has order
 * PMD_SHIFT - PAGE_SHIFT; every other entry has order 0. Without
 * CONFIG_FS_DAX_PMD the order is always 0.
 */
#ifdef CONFIG_FS_DAX_PMD
static inline unsigned int dax_radix_order(void *entry)
{
	if ((unsigned long)entry & RADIX_DAX_PMD)
		return PMD_SHIFT - PAGE_SHIFT;
	return 0;
}
#else
static inline unsigned int dax_radix_order(void *entry)
{
	return 0;
}
#endif
/* Declared here only; the definition lives outside this header. */
int dax_pfn_mkwrite(struct vm_fault *vmf);
Matthew Wilcoxc94c2ac2015-09-08 14:58:40 -070095
Matthew Wilcox4897c762015-09-08 14:58:45 -070096static inline bool vma_is_dax(struct vm_area_struct *vma)
97{
98 return vma->vm_file && IS_DAX(vma->vm_file->f_mapping->host);
99}
Ross Zwislerf9fe48b2016-01-22 15:10:40 -0800100
101static inline bool dax_mapping(struct address_space *mapping)
102{
103 return mapping->host && IS_DAX(mapping->host);
104}
Ross Zwisler7f6d5b52016-02-26 15:19:55 -0800105
/* Forward declaration: only a pointer to it is needed by the prototype below. */
struct writeback_control;
int dax_writeback_mapping_range(struct address_space *mapping,
		struct block_device *bdev, struct writeback_control *wbc);
Matthew Wilcoxc94c2ac2015-09-08 14:58:40 -0700109#endif