Matthew Wilcox | c94c2ac | 2015-09-08 14:58:40 -0700 | [diff] [blame] | 1 | #ifndef _LINUX_DAX_H |
| 2 | #define _LINUX_DAX_H |
| 3 | |
| 4 | #include <linux/fs.h> |
| 5 | #include <linux/mm.h> |
Jan Kara | 4f62293 | 2016-05-12 18:29:17 +0200 | [diff] [blame] | 6 | #include <linux/radix-tree.h> |
Matthew Wilcox | c94c2ac | 2015-09-08 14:58:40 -0700 | [diff] [blame] | 7 | #include <asm/pgtable.h> |
| 8 | |
Christoph Hellwig | a254e56 | 2016-09-19 11:24:49 +1000 | [diff] [blame] | 9 | struct iomap_ops; |
Dan Williams | 6568b08 | 2017-01-24 18:44:18 -0800 | [diff] [blame] | 10 | struct dax_device; |
| 11 | struct dax_operations { |
| 12 | /* |
| 13 | * direct_access: translate a device-relative |
| 14 | * logical-page-offset into an absolute physical pfn. Return the |
| 15 | * number of pages available for DAX at that pfn. |
| 16 | */ |
| 17 | long (*direct_access)(struct dax_device *, pgoff_t, long, |
| 18 | void **, pfn_t *); |
Dan Williams | 0aed55a | 2017-05-29 12:22:50 -0700 | [diff] [blame] | 19 | /* copy_from_iter: dax-driver override for default copy_from_iter */ |
| 20 | size_t (*copy_from_iter)(struct dax_device *, pgoff_t, void *, size_t, |
| 21 | struct iov_iter *); |
Dan Williams | 3c1cebf | 2017-05-29 12:58:19 -0700 | [diff] [blame] | 22 | /* flush: optional driver-specific cache management after writes */ |
| 23 | void (*flush)(struct dax_device *, pgoff_t, void *, size_t); |
Dan Williams | 6568b08 | 2017-01-24 18:44:18 -0800 | [diff] [blame] | 24 | }; |
Christoph Hellwig | a254e56 | 2016-09-19 11:24:49 +1000 | [diff] [blame] | 25 | |
Dan Williams | ef510424 | 2017-05-08 10:55:27 -0700 | [diff] [blame] | 26 | #if IS_ENABLED(CONFIG_DAX) |
| 27 | struct dax_device *dax_get_by_host(const char *host); |
| 28 | void put_dax(struct dax_device *dax_dev); |
| 29 | #else |
| 30 | static inline struct dax_device *dax_get_by_host(const char *host) |
| 31 | { |
| 32 | return NULL; |
| 33 | } |
| 34 | |
| 35 | static inline void put_dax(struct dax_device *dax_dev) |
| 36 | { |
| 37 | } |
| 38 | #endif |
| 39 | |
Dan Williams | f5705aa8c | 2017-05-13 16:31:05 -0700 | [diff] [blame] | 40 | int bdev_dax_pgoff(struct block_device *, sector_t, size_t, pgoff_t *pgoff); |
| 41 | #if IS_ENABLED(CONFIG_FS_DAX) |
| 42 | int __bdev_dax_supported(struct super_block *sb, int blocksize); |
| 43 | static inline int bdev_dax_supported(struct super_block *sb, int blocksize) |
| 44 | { |
| 45 | return __bdev_dax_supported(sb, blocksize); |
| 46 | } |
| 47 | |
| 48 | static inline struct dax_device *fs_dax_get_by_host(const char *host) |
| 49 | { |
| 50 | return dax_get_by_host(host); |
| 51 | } |
| 52 | |
| 53 | static inline void fs_put_dax(struct dax_device *dax_dev) |
| 54 | { |
| 55 | put_dax(dax_dev); |
| 56 | } |
| 57 | |
| 58 | #else |
| 59 | static inline int bdev_dax_supported(struct super_block *sb, int blocksize) |
| 60 | { |
| 61 | return -EOPNOTSUPP; |
| 62 | } |
| 63 | |
| 64 | static inline struct dax_device *fs_dax_get_by_host(const char *host) |
| 65 | { |
| 66 | return NULL; |
| 67 | } |
| 68 | |
| 69 | static inline void fs_put_dax(struct dax_device *dax_dev) |
| 70 | { |
| 71 | } |
| 72 | #endif |
| 73 | |
Dan Williams | 7b6be84 | 2017-04-11 09:49:49 -0700 | [diff] [blame] | 74 | int dax_read_lock(void); |
| 75 | void dax_read_unlock(int id); |
Dan Williams | c1d6e82 | 2017-01-24 23:02:09 -0800 | [diff] [blame] | 76 | struct dax_device *alloc_dax(void *private, const char *host, |
| 77 | const struct dax_operations *ops); |
Dan Williams | c1d6e82 | 2017-01-24 23:02:09 -0800 | [diff] [blame] | 78 | bool dax_alive(struct dax_device *dax_dev); |
| 79 | void kill_dax(struct dax_device *dax_dev); |
| 80 | void *dax_get_private(struct dax_device *dax_dev); |
Dan Williams | b068626 | 2017-01-26 20:37:35 -0800 | [diff] [blame] | 81 | long dax_direct_access(struct dax_device *dax_dev, pgoff_t pgoff, long nr_pages, |
| 82 | void **kaddr, pfn_t *pfn); |
Dan Williams | 7e026c8 | 2017-05-29 12:57:56 -0700 | [diff] [blame] | 83 | size_t dax_copy_from_iter(struct dax_device *dax_dev, pgoff_t pgoff, void *addr, |
| 84 | size_t bytes, struct iov_iter *i); |
Dan Williams | abebfbe | 2017-05-29 13:02:52 -0700 | [diff] [blame^] | 85 | void dax_flush(struct dax_device *dax_dev, pgoff_t pgoff, void *addr, |
| 86 | size_t size); |
Dan Williams | 7b6be84 | 2017-04-11 09:49:49 -0700 | [diff] [blame] | 87 | |
/*
 * Four special bits are reserved in a DAX exceptional radix tree entry,
 * starting at the lowest available bit (RADIX_TREE_EXCEPTIONAL_SHIFT):
 *
 *   RADIX_DAX_ENTRY_LOCK - the entry lock
 *   RADIX_DAX_PMD        - entry size: set for a PMD entry, clear for an
 *                          entry of size PAGE_SIZE
 *   RADIX_DAX_HZP        - the entry is a huge zero page
 *   RADIX_DAX_EMPTY      - the entry is empty and only used for locking
 *
 * When neither the HZP nor the EMPTY bit is set, the entry is a normal DAX
 * entry with a filesystem block allocation.  RADIX_DAX_SHIFT is the first
 * bit position above these four flags.
 */
#define RADIX_DAX_SHIFT		(RADIX_TREE_EXCEPTIONAL_SHIFT + 4)
#define RADIX_DAX_ENTRY_LOCK	(1 << RADIX_TREE_EXCEPTIONAL_SHIFT)
#define RADIX_DAX_PMD		(1 << (RADIX_TREE_EXCEPTIONAL_SHIFT + 1))
#define RADIX_DAX_HZP		(1 << (RADIX_TREE_EXCEPTIONAL_SHIFT + 2))
#define RADIX_DAX_EMPTY		(1 << (RADIX_TREE_EXCEPTIONAL_SHIFT + 3))
Ross Zwisler | fa28f72 | 2016-11-08 11:33:35 +1100 | [diff] [blame] | 103 | |
Ross Zwisler | 642261a | 2016-11-08 11:34:45 +1100 | [diff] [blame] | 104 | static inline unsigned long dax_radix_sector(void *entry) |
| 105 | { |
| 106 | return (unsigned long)entry >> RADIX_DAX_SHIFT; |
| 107 | } |
| 108 | |
| 109 | static inline void *dax_radix_locked_entry(sector_t sector, unsigned long flags) |
| 110 | { |
| 111 | return (void *)(RADIX_TREE_EXCEPTIONAL_ENTRY | flags | |
| 112 | ((unsigned long)sector << RADIX_DAX_SHIFT) | |
| 113 | RADIX_DAX_ENTRY_LOCK); |
| 114 | } |
Jan Kara | e804315 | 2016-05-12 18:29:16 +0200 | [diff] [blame] | 115 | |
Ross Zwisler | 11c59c9 | 2016-11-08 11:32:46 +1100 | [diff] [blame] | 116 | ssize_t dax_iomap_rw(struct kiocb *iocb, struct iov_iter *iter, |
Christoph Hellwig | 8ff6daa | 2017-01-27 23:20:26 -0800 | [diff] [blame] | 117 | const struct iomap_ops *ops); |
Dave Jiang | c791ace | 2017-02-24 14:57:08 -0800 | [diff] [blame] | 118 | int dax_iomap_fault(struct vm_fault *vmf, enum page_entry_size pe_size, |
| 119 | const struct iomap_ops *ops); |
Jan Kara | ac401cc | 2016-05-12 18:29:18 +0200 | [diff] [blame] | 120 | int dax_delete_mapping_entry(struct address_space *mapping, pgoff_t index); |
Jan Kara | c6dcf52 | 2016-08-10 17:22:44 +0200 | [diff] [blame] | 121 | int dax_invalidate_mapping_entry_sync(struct address_space *mapping, |
| 122 | pgoff_t index); |
Jan Kara | ac401cc | 2016-05-12 18:29:18 +0200 | [diff] [blame] | 123 | void dax_wake_mapping_entry_waiter(struct address_space *mapping, |
Ross Zwisler | 63e95b5 | 2016-11-08 11:32:20 +1100 | [diff] [blame] | 124 | pgoff_t index, void *entry, bool wake_all); |
Dan Williams | d1a5f2b4 | 2016-01-28 20:25:31 -0800 | [diff] [blame] | 125 | |
| 126 | #ifdef CONFIG_FS_DAX |
Dan Williams | cccbce6 | 2017-01-27 13:31:42 -0800 | [diff] [blame] | 127 | int __dax_zero_page_range(struct block_device *bdev, |
| 128 | struct dax_device *dax_dev, sector_t sector, |
Christoph Hellwig | 679c8bd | 2016-05-09 10:47:04 +0200 | [diff] [blame] | 129 | unsigned int offset, unsigned int length); |
Dan Williams | d1a5f2b4 | 2016-01-28 20:25:31 -0800 | [diff] [blame] | 130 | #else |
Christoph Hellwig | 679c8bd | 2016-05-09 10:47:04 +0200 | [diff] [blame] | 131 | static inline int __dax_zero_page_range(struct block_device *bdev, |
Dan Williams | cccbce6 | 2017-01-27 13:31:42 -0800 | [diff] [blame] | 132 | struct dax_device *dax_dev, sector_t sector, |
| 133 | unsigned int offset, unsigned int length) |
Christoph Hellwig | 679c8bd | 2016-05-09 10:47:04 +0200 | [diff] [blame] | 134 | { |
| 135 | return -ENXIO; |
| 136 | } |
Dan Williams | d1a5f2b4 | 2016-01-28 20:25:31 -0800 | [diff] [blame] | 137 | #endif |
| 138 | |
/*
 * Order of a DAX radix tree entry: PMD_SHIFT - PAGE_SHIFT when the entry has
 * RADIX_DAX_PMD set and PMD support is built in, otherwise 0.
 */
#ifdef CONFIG_FS_DAX_PMD
static inline unsigned int dax_radix_order(void *entry)
{
	unsigned long bits = (unsigned long)entry;

	return (bits & RADIX_DAX_PMD) ? PMD_SHIFT - PAGE_SHIFT : 0;
}
#else /* !CONFIG_FS_DAX_PMD */
static inline unsigned int dax_radix_order(void *entry)
{
	return 0;
}
#endif /* CONFIG_FS_DAX_PMD */
/* Prototype only; the definition lives outside this header. */
int dax_pfn_mkwrite(struct vm_fault *vmf);
Matthew Wilcox | c94c2ac | 2015-09-08 14:58:40 -0700 | [diff] [blame] | 153 | |
Matthew Wilcox | 4897c76 | 2015-09-08 14:58:45 -0700 | [diff] [blame] | 154 | static inline bool vma_is_dax(struct vm_area_struct *vma) |
| 155 | { |
| 156 | return vma->vm_file && IS_DAX(vma->vm_file->f_mapping->host); |
| 157 | } |
Ross Zwisler | f9fe48b | 2016-01-22 15:10:40 -0800 | [diff] [blame] | 158 | |
| 159 | static inline bool dax_mapping(struct address_space *mapping) |
| 160 | { |
| 161 | return mapping->host && IS_DAX(mapping->host); |
| 162 | } |
Ross Zwisler | 7f6d5b5 | 2016-02-26 15:19:55 -0800 | [diff] [blame] | 163 | |
/* Forward declaration: only a pointer to the structure is needed below. */
struct writeback_control;

/* Prototype only; the definition lives outside this header. */
int dax_writeback_mapping_range(struct address_space *mapping,
				struct block_device *bdev,
				struct writeback_control *wbc);
Matthew Wilcox | c94c2ac | 2015-09-08 14:58:40 -0700 | [diff] [blame] | 167 | #endif |