Matthew Wilcox | c94c2ac | 2015-09-08 14:58:40 -0700 | [diff] [blame] | 1 | #ifndef _LINUX_DAX_H |
| 2 | #define _LINUX_DAX_H |
| 3 | |
| 4 | #include <linux/fs.h> |
| 5 | #include <linux/mm.h> |
Jan Kara | 4f62293 | 2016-05-12 18:29:17 +0200 | [diff] [blame] | 6 | #include <linux/radix-tree.h> |
Matthew Wilcox | c94c2ac | 2015-09-08 14:58:40 -0700 | [diff] [blame] | 7 | #include <asm/pgtable.h> |
| 8 | |
Christoph Hellwig | a254e56 | 2016-09-19 11:24:49 +1000 | [diff] [blame] | 9 | struct iomap_ops; |
Dan Williams | 6568b08 | 2017-01-24 18:44:18 -0800 | [diff] [blame] | 10 | struct dax_device; |
| 11 | struct dax_operations { |
| 12 | /* |
| 13 | * direct_access: translate a device-relative |
| 14 | * logical-page-offset into an absolute physical pfn. Return the |
| 15 | * number of pages available for DAX at that pfn. |
| 16 | */ |
| 17 | long (*direct_access)(struct dax_device *, pgoff_t, long, |
| 18 | void **, pfn_t *); |
Dan Williams | 5d61e43 | 2017-06-27 13:06:22 -0700 | [diff] [blame] | 19 | /* copy_from_iter: required operation for fs-dax direct-i/o */ |
Dan Williams | 0aed55a | 2017-05-29 12:22:50 -0700 | [diff] [blame] | 20 | size_t (*copy_from_iter)(struct dax_device *, pgoff_t, void *, size_t, |
| 21 | struct iov_iter *); |
Dan Williams | 3c1cebf | 2017-05-29 12:58:19 -0700 | [diff] [blame] | 22 | /* flush: optional driver-specific cache management after writes */ |
| 23 | void (*flush)(struct dax_device *, pgoff_t, void *, size_t); |
Dan Williams | 6568b08 | 2017-01-24 18:44:18 -0800 | [diff] [blame] | 24 | }; |
Christoph Hellwig | a254e56 | 2016-09-19 11:24:49 +1000 | [diff] [blame] | 25 | |
/*
 * Declaration only; the object itself is defined outside this header.
 * NOTE(review): presumably the attribute group exposed for dax devices -
 * confirm against the defining file.
 */
extern struct attribute_group dax_attribute_group;
| 27 | |
Dan Williams | ef510424 | 2017-05-08 10:55:27 -0700 | [diff] [blame] | 28 | #if IS_ENABLED(CONFIG_DAX) |
| 29 | struct dax_device *dax_get_by_host(const char *host); |
| 30 | void put_dax(struct dax_device *dax_dev); |
| 31 | #else |
| 32 | static inline struct dax_device *dax_get_by_host(const char *host) |
| 33 | { |
| 34 | return NULL; |
| 35 | } |
| 36 | |
| 37 | static inline void put_dax(struct dax_device *dax_dev) |
| 38 | { |
| 39 | } |
| 40 | #endif |
| 41 | |
Dan Williams | f5705aa8c | 2017-05-13 16:31:05 -0700 | [diff] [blame] | 42 | int bdev_dax_pgoff(struct block_device *, sector_t, size_t, pgoff_t *pgoff); |
| 43 | #if IS_ENABLED(CONFIG_FS_DAX) |
| 44 | int __bdev_dax_supported(struct super_block *sb, int blocksize); |
| 45 | static inline int bdev_dax_supported(struct super_block *sb, int blocksize) |
| 46 | { |
| 47 | return __bdev_dax_supported(sb, blocksize); |
| 48 | } |
| 49 | |
| 50 | static inline struct dax_device *fs_dax_get_by_host(const char *host) |
| 51 | { |
| 52 | return dax_get_by_host(host); |
| 53 | } |
| 54 | |
| 55 | static inline void fs_put_dax(struct dax_device *dax_dev) |
| 56 | { |
| 57 | put_dax(dax_dev); |
| 58 | } |
| 59 | |
| 60 | #else |
| 61 | static inline int bdev_dax_supported(struct super_block *sb, int blocksize) |
| 62 | { |
| 63 | return -EOPNOTSUPP; |
| 64 | } |
| 65 | |
| 66 | static inline struct dax_device *fs_dax_get_by_host(const char *host) |
| 67 | { |
| 68 | return NULL; |
| 69 | } |
| 70 | |
| 71 | static inline void fs_put_dax(struct dax_device *dax_dev) |
| 72 | { |
| 73 | } |
| 74 | #endif |
| 75 | |
Dan Williams | 7b6be84 | 2017-04-11 09:49:49 -0700 | [diff] [blame] | 76 | int dax_read_lock(void); |
| 77 | void dax_read_unlock(int id); |
Dan Williams | c1d6e82 | 2017-01-24 23:02:09 -0800 | [diff] [blame] | 78 | struct dax_device *alloc_dax(void *private, const char *host, |
| 79 | const struct dax_operations *ops); |
Dan Williams | c1d6e82 | 2017-01-24 23:02:09 -0800 | [diff] [blame] | 80 | bool dax_alive(struct dax_device *dax_dev); |
| 81 | void kill_dax(struct dax_device *dax_dev); |
| 82 | void *dax_get_private(struct dax_device *dax_dev); |
Dan Williams | b068626 | 2017-01-26 20:37:35 -0800 | [diff] [blame] | 83 | long dax_direct_access(struct dax_device *dax_dev, pgoff_t pgoff, long nr_pages, |
| 84 | void **kaddr, pfn_t *pfn); |
Dan Williams | 7e026c8 | 2017-05-29 12:57:56 -0700 | [diff] [blame] | 85 | size_t dax_copy_from_iter(struct dax_device *dax_dev, pgoff_t pgoff, void *addr, |
| 86 | size_t bytes, struct iov_iter *i); |
Dan Williams | abebfbe | 2017-05-29 13:02:52 -0700 | [diff] [blame] | 87 | void dax_flush(struct dax_device *dax_dev, pgoff_t pgoff, void *addr, |
| 88 | size_t size); |
Dan Williams | 6e0c90d | 2017-06-26 21:28:41 -0700 | [diff] [blame] | 89 | void dax_write_cache(struct dax_device *dax_dev, bool wc); |
Dan Williams | 7b6be84 | 2017-04-11 09:49:49 -0700 | [diff] [blame] | 90 | |
/*
 * We use the lowest available bit in an exceptional entry for locking, one
 * bit for the entry size (PMD) and two more to tell us if the entry is a huge
 * zero page (HZP) or an empty entry that is just used for locking. In total
 * four special bits.
 *
 * If the PMD bit isn't set the entry has size PAGE_SIZE, and if the HZP and
 * EMPTY bits aren't set the entry is a normal DAX entry with a filesystem
 * block allocation.
 *
 * RADIX_DAX_SHIFT is the first bit position above those four flag bits; the
 * dax_radix_sector() and dax_radix_locked_entry() helpers below keep the
 * sector in the bits from that position upwards.
 */
#define RADIX_DAX_SHIFT (RADIX_TREE_EXCEPTIONAL_SHIFT + 4)
/* Lock bit: the lowest bit available in an exceptional entry. */
#define RADIX_DAX_ENTRY_LOCK (1 << RADIX_TREE_EXCEPTIONAL_SHIFT)
/* Entry-size bit: set for a PMD-sized entry, clear for PAGE_SIZE. */
#define RADIX_DAX_PMD (1 << (RADIX_TREE_EXCEPTIONAL_SHIFT + 1))
/* Set when the entry is a huge zero page. */
#define RADIX_DAX_HZP (1 << (RADIX_TREE_EXCEPTIONAL_SHIFT + 2))
/* Set when the entry is empty and only used for locking. */
#define RADIX_DAX_EMPTY (1 << (RADIX_TREE_EXCEPTIONAL_SHIFT + 3))
Ross Zwisler | fa28f72 | 2016-11-08 11:33:35 +1100 | [diff] [blame] | 106 | |
Ross Zwisler | 642261a | 2016-11-08 11:34:45 +1100 | [diff] [blame] | 107 | static inline unsigned long dax_radix_sector(void *entry) |
| 108 | { |
| 109 | return (unsigned long)entry >> RADIX_DAX_SHIFT; |
| 110 | } |
| 111 | |
| 112 | static inline void *dax_radix_locked_entry(sector_t sector, unsigned long flags) |
| 113 | { |
| 114 | return (void *)(RADIX_TREE_EXCEPTIONAL_ENTRY | flags | |
| 115 | ((unsigned long)sector << RADIX_DAX_SHIFT) | |
| 116 | RADIX_DAX_ENTRY_LOCK); |
| 117 | } |
Jan Kara | e804315 | 2016-05-12 18:29:16 +0200 | [diff] [blame] | 118 | |
Ross Zwisler | 11c59c9 | 2016-11-08 11:32:46 +1100 | [diff] [blame] | 119 | ssize_t dax_iomap_rw(struct kiocb *iocb, struct iov_iter *iter, |
Christoph Hellwig | 8ff6daa | 2017-01-27 23:20:26 -0800 | [diff] [blame] | 120 | const struct iomap_ops *ops); |
Dave Jiang | c791ace | 2017-02-24 14:57:08 -0800 | [diff] [blame] | 121 | int dax_iomap_fault(struct vm_fault *vmf, enum page_entry_size pe_size, |
| 122 | const struct iomap_ops *ops); |
Jan Kara | ac401cc | 2016-05-12 18:29:18 +0200 | [diff] [blame] | 123 | int dax_delete_mapping_entry(struct address_space *mapping, pgoff_t index); |
Jan Kara | c6dcf52 | 2016-08-10 17:22:44 +0200 | [diff] [blame] | 124 | int dax_invalidate_mapping_entry_sync(struct address_space *mapping, |
| 125 | pgoff_t index); |
Jan Kara | ac401cc | 2016-05-12 18:29:18 +0200 | [diff] [blame] | 126 | void dax_wake_mapping_entry_waiter(struct address_space *mapping, |
Ross Zwisler | 63e95b5 | 2016-11-08 11:32:20 +1100 | [diff] [blame] | 127 | pgoff_t index, void *entry, bool wake_all); |
Dan Williams | d1a5f2b4 | 2016-01-28 20:25:31 -0800 | [diff] [blame] | 128 | |
| 129 | #ifdef CONFIG_FS_DAX |
Dan Williams | cccbce6 | 2017-01-27 13:31:42 -0800 | [diff] [blame] | 130 | int __dax_zero_page_range(struct block_device *bdev, |
| 131 | struct dax_device *dax_dev, sector_t sector, |
Christoph Hellwig | 679c8bd | 2016-05-09 10:47:04 +0200 | [diff] [blame] | 132 | unsigned int offset, unsigned int length); |
Dan Williams | d1a5f2b4 | 2016-01-28 20:25:31 -0800 | [diff] [blame] | 133 | #else |
Christoph Hellwig | 679c8bd | 2016-05-09 10:47:04 +0200 | [diff] [blame] | 134 | static inline int __dax_zero_page_range(struct block_device *bdev, |
Dan Williams | cccbce6 | 2017-01-27 13:31:42 -0800 | [diff] [blame] | 135 | struct dax_device *dax_dev, sector_t sector, |
| 136 | unsigned int offset, unsigned int length) |
Christoph Hellwig | 679c8bd | 2016-05-09 10:47:04 +0200 | [diff] [blame] | 137 | { |
| 138 | return -ENXIO; |
| 139 | } |
Dan Williams | d1a5f2b4 | 2016-01-28 20:25:31 -0800 | [diff] [blame] | 140 | #endif |
| 141 | |
/*
 * dax_radix_order - page order covered by a DAX radix tree entry.
 * @entry: entry value as stored in the tree
 *
 * Returns PMD_SHIFT - PAGE_SHIFT when CONFIG_FS_DAX_PMD is defined and the
 * entry has RADIX_DAX_PMD set; returns 0 in every other case.
 */
static inline unsigned int dax_radix_order(void *entry)
{
#ifdef CONFIG_FS_DAX_PMD
	/* Only a PMD-flagged entry spans more than a single page. */
	if ((unsigned long)entry & RADIX_DAX_PMD)
		return PMD_SHIFT - PAGE_SHIFT;
#endif
	return 0;
}
/*
 * Declaration only; takes the vm_fault for the access being handled.
 * NOTE(review): presumably the mkwrite handler for pfn-mapped DAX pages -
 * confirm against the definition.
 */
int dax_pfn_mkwrite(struct vm_fault *vmf);
Matthew Wilcox | c94c2ac | 2015-09-08 14:58:40 -0700 | [diff] [blame] | 156 | |
Ross Zwisler | f9fe48b | 2016-01-22 15:10:40 -0800 | [diff] [blame] | 157 | static inline bool dax_mapping(struct address_space *mapping) |
| 158 | { |
| 159 | return mapping->host && IS_DAX(mapping->host); |
| 160 | } |
Ross Zwisler | 7f6d5b5 | 2016-02-26 15:19:55 -0800 | [diff] [blame] | 161 | |
/* Only a pointer is used here, so a forward declaration is enough. */
struct writeback_control;

int dax_writeback_mapping_range(struct address_space *mapping,
				struct block_device *bdev,
				struct writeback_control *wbc);
Matthew Wilcox | c94c2ac | 2015-09-08 14:58:40 -0700 | [diff] [blame] | 165 | #endif |