blob: ac8afa18f707410ec6b837051f7395650ac6f4dc [file] [log] [blame]
Matthew Wilcoxc94c2ac2015-09-08 14:58:40 -07001#ifndef _LINUX_DAX_H
2#define _LINUX_DAX_H
3
4#include <linux/fs.h>
5#include <linux/mm.h>
Jan Kara4f622932016-05-12 18:29:17 +02006#include <linux/radix-tree.h>
Matthew Wilcoxc94c2ac2015-09-08 14:58:40 -07007#include <asm/pgtable.h>
8
Christoph Hellwiga254e562016-09-19 11:24:49 +10009struct iomap_ops;
Dan Williams6568b082017-01-24 18:44:18 -080010struct dax_device;
11struct dax_operations {
12 /*
13 * direct_access: translate a device-relative
14 * logical-page-offset into an absolute physical pfn. Return the
15 * number of pages available for DAX at that pfn.
16 */
17 long (*direct_access)(struct dax_device *, pgoff_t, long,
18 void **, pfn_t *);
Dan Williams5d61e432017-06-27 13:06:22 -070019 /* copy_from_iter: required operation for fs-dax direct-i/o */
Dan Williams0aed55a2017-05-29 12:22:50 -070020 size_t (*copy_from_iter)(struct dax_device *, pgoff_t, void *, size_t,
21 struct iov_iter *);
Dan Williams3c1cebf2017-05-29 12:58:19 -070022 /* flush: optional driver-specific cache management after writes */
23 void (*flush)(struct dax_device *, pgoff_t, void *, size_t);
Dan Williams6568b082017-01-24 18:44:18 -080024};
Christoph Hellwiga254e562016-09-19 11:24:49 +100025
/* Attribute group for dax devices; defined outside this header. */
extern struct attribute_group dax_attribute_group;
27
Dan Williamsef5104242017-05-08 10:55:27 -070028#if IS_ENABLED(CONFIG_DAX)
/*
 * CONFIG_DAX enabled: both helpers are implemented outside this header.
 * NOTE(review): put_dax() presumably drops what dax_get_by_host() acquired;
 * confirm against the implementation.
 */
struct dax_device *dax_get_by_host(const char *host);
void put_dax(struct dax_device *dax_dev);
31#else
/* CONFIG_DAX disabled: no device can be looked up, so always return NULL. */
static inline struct dax_device *dax_get_by_host(const char *host)
{
	return NULL;
}
36
/* CONFIG_DAX disabled: nothing to release, so this is a no-op. */
static inline void put_dax(struct dax_device *dax_dev)
{
}
40#endif
41
Dan Williamsf5705aa8c2017-05-13 16:31:05 -070042int bdev_dax_pgoff(struct block_device *, sector_t, size_t, pgoff_t *pgoff);
43#if IS_ENABLED(CONFIG_FS_DAX)
int __bdev_dax_supported(struct super_block *sb, int blocksize);

/*
 * CONFIG_FS_DAX enabled: forward to __bdev_dax_supported() and return its
 * result unchanged.
 */
static inline int bdev_dax_supported(struct super_block *sb, int blocksize)
{
	return __bdev_dax_supported(sb, blocksize);
}
49
/* CONFIG_FS_DAX enabled: filesystem-facing alias for dax_get_by_host(). */
static inline struct dax_device *fs_dax_get_by_host(const char *host)
{
	return dax_get_by_host(host);
}
54
/* CONFIG_FS_DAX enabled: filesystem-facing alias for put_dax(). */
static inline void fs_put_dax(struct dax_device *dax_dev)
{
	put_dax(dax_dev);
}
59
/* CONFIG_FS_DAX enabled: implemented outside this header. */
struct dax_device *fs_dax_get_by_bdev(struct block_device *bdev);
Dan Williamsf5705aa8c2017-05-13 16:31:05 -070061#else
/* CONFIG_FS_DAX disabled: DAX is never supported, report -EOPNOTSUPP. */
static inline int bdev_dax_supported(struct super_block *sb, int blocksize)
{
	return -EOPNOTSUPP;
}
66
/* CONFIG_FS_DAX disabled: there is no dax device to hand out. */
static inline struct dax_device *fs_dax_get_by_host(const char *host)
{
	return NULL;
}
71
/* CONFIG_FS_DAX disabled: nothing to release, so this is a no-op. */
static inline void fs_put_dax(struct dax_device *dax_dev)
{
}
Dan Williams78f35472017-08-30 09:16:38 -070075
/* CONFIG_FS_DAX disabled: no block device has an associated dax device. */
static inline struct dax_device *fs_dax_get_by_bdev(struct block_device *bdev)
{
	return NULL;
}
Dan Williamsf5705aa8c2017-05-13 16:31:05 -070080#endif
81
Dan Williams7b6be842017-04-11 09:49:49 -070082int dax_read_lock(void);
83void dax_read_unlock(int id);
Dan Williamsc1d6e822017-01-24 23:02:09 -080084struct dax_device *alloc_dax(void *private, const char *host,
85 const struct dax_operations *ops);
Dan Williamsc1d6e822017-01-24 23:02:09 -080086bool dax_alive(struct dax_device *dax_dev);
87void kill_dax(struct dax_device *dax_dev);
88void *dax_get_private(struct dax_device *dax_dev);
Dan Williamsb0686262017-01-26 20:37:35 -080089long dax_direct_access(struct dax_device *dax_dev, pgoff_t pgoff, long nr_pages,
90 void **kaddr, pfn_t *pfn);
Dan Williams7e026c82017-05-29 12:57:56 -070091size_t dax_copy_from_iter(struct dax_device *dax_dev, pgoff_t pgoff, void *addr,
92 size_t bytes, struct iov_iter *i);
Dan Williamsabebfbe22017-05-29 13:02:52 -070093void dax_flush(struct dax_device *dax_dev, pgoff_t pgoff, void *addr,
94 size_t size);
Dan Williams6e0c90d2017-06-26 21:28:41 -070095void dax_write_cache(struct dax_device *dax_dev, bool wc);
Vivek Goyal273752c2017-07-26 09:35:09 -040096bool dax_write_cache_enabled(struct dax_device *dax_dev);
Dan Williams7b6be842017-04-11 09:49:49 -070097
/*
 * We use the lowest available bit in an exceptional entry for locking, one
 * bit for the entry size (PMD) and two more to tell us if the entry is a huge
 * zero page (HZP) or an empty entry that is just used for locking.  In total
 * four special bits, which is why RADIX_DAX_SHIFT sits four bits above
 * RADIX_TREE_EXCEPTIONAL_SHIFT.
 *
 * If the PMD bit isn't set the entry has size PAGE_SIZE, and if the HZP and
 * EMPTY bits aren't set the entry is a normal DAX entry with a filesystem
 * block allocation.
 */
#define RADIX_DAX_SHIFT		(RADIX_TREE_EXCEPTIONAL_SHIFT + 4)
#define RADIX_DAX_ENTRY_LOCK	(1 << RADIX_TREE_EXCEPTIONAL_SHIFT)
#define RADIX_DAX_PMD		(1 << (RADIX_TREE_EXCEPTIONAL_SHIFT + 1))
#define RADIX_DAX_HZP		(1 << (RADIX_TREE_EXCEPTIONAL_SHIFT + 2))
#define RADIX_DAX_EMPTY		(1 << (RADIX_TREE_EXCEPTIONAL_SHIFT + 3))
Ross Zwislerfa28f722016-11-08 11:33:35 +1100113
Ross Zwisler642261a2016-11-08 11:34:45 +1100114static inline unsigned long dax_radix_sector(void *entry)
115{
116 return (unsigned long)entry >> RADIX_DAX_SHIFT;
117}
118
119static inline void *dax_radix_locked_entry(sector_t sector, unsigned long flags)
120{
121 return (void *)(RADIX_TREE_EXCEPTIONAL_ENTRY | flags |
122 ((unsigned long)sector << RADIX_DAX_SHIFT) |
123 RADIX_DAX_ENTRY_LOCK);
124}
Jan Karae8043152016-05-12 18:29:16 +0200125
Ross Zwisler11c59c92016-11-08 11:32:46 +1100126ssize_t dax_iomap_rw(struct kiocb *iocb, struct iov_iter *iter,
Christoph Hellwig8ff6daa2017-01-27 23:20:26 -0800127 const struct iomap_ops *ops);
Dave Jiangc791ace2017-02-24 14:57:08 -0800128int dax_iomap_fault(struct vm_fault *vmf, enum page_entry_size pe_size,
129 const struct iomap_ops *ops);
Jan Karaac401cc2016-05-12 18:29:18 +0200130int dax_delete_mapping_entry(struct address_space *mapping, pgoff_t index);
Jan Karac6dcf522016-08-10 17:22:44 +0200131int dax_invalidate_mapping_entry_sync(struct address_space *mapping,
132 pgoff_t index);
Jan Karaac401cc2016-05-12 18:29:18 +0200133void dax_wake_mapping_entry_waiter(struct address_space *mapping,
Ross Zwisler63e95b52016-11-08 11:32:20 +1100134 pgoff_t index, void *entry, bool wake_all);
Dan Williamsd1a5f2b42016-01-28 20:25:31 -0800135
136#ifdef CONFIG_FS_DAX
Dan Williamscccbce62017-01-27 13:31:42 -0800137int __dax_zero_page_range(struct block_device *bdev,
138 struct dax_device *dax_dev, sector_t sector,
Christoph Hellwig679c8bd2016-05-09 10:47:04 +0200139 unsigned int offset, unsigned int length);
Dan Williamsd1a5f2b42016-01-28 20:25:31 -0800140#else
Christoph Hellwig679c8bd2016-05-09 10:47:04 +0200141static inline int __dax_zero_page_range(struct block_device *bdev,
Dan Williamscccbce62017-01-27 13:31:42 -0800142 struct dax_device *dax_dev, sector_t sector,
143 unsigned int offset, unsigned int length)
Christoph Hellwig679c8bd2016-05-09 10:47:04 +0200144{
145 return -ENXIO;
146}
Dan Williamsd1a5f2b42016-01-28 20:25:31 -0800147#endif
148
Ross Zwisler642261a2016-11-08 11:34:45 +1100149#ifdef CONFIG_FS_DAX_PMD
150static inline unsigned int dax_radix_order(void *entry)
151{
152 if ((unsigned long)entry & RADIX_DAX_PMD)
153 return PMD_SHIFT - PAGE_SHIFT;
154 return 0;
155}
Ross Zwisler642261a2016-11-08 11:34:45 +1100156#else
/* CONFIG_FS_DAX_PMD disabled: every entry is reported as order 0. */
static inline unsigned int dax_radix_order(void *entry)
{
	return 0;
}
Ross Zwisler642261a2016-11-08 11:34:45 +1100161#endif
/* Takes the vm_fault being handled; implemented outside this header. */
int dax_pfn_mkwrite(struct vm_fault *vmf);
Matthew Wilcoxc94c2ac2015-09-08 14:58:40 -0700163
Ross Zwislerf9fe48b2016-01-22 15:10:40 -0800164static inline bool dax_mapping(struct address_space *mapping)
165{
166 return mapping->host && IS_DAX(mapping->host);
167}
Ross Zwisler7f6d5b52016-02-26 15:19:55 -0800168
/* Forward declaration: only a pointer to it is needed by the prototype. */
struct writeback_control;

/* Implemented outside this header. */
int dax_writeback_mapping_range(struct address_space *mapping,
		struct block_device *bdev, struct writeback_control *wbc);
Matthew Wilcoxc94c2ac2015-09-08 14:58:40 -0700172#endif