Thomas Gleixner | c942fdd | 2019-05-27 08:55:06 +0200 | [diff] [blame] | 1 | /* SPDX-License-Identifier: GPL-2.0-or-later */ |
Jérôme Glisse | 133ff0e | 2017-09-08 16:11:23 -0700 | [diff] [blame] | 2 | /* |
| 3 | * Copyright 2013 Red Hat Inc. |
| 4 | * |
Jérôme Glisse | f813f21 | 2018-10-30 15:04:06 -0700 | [diff] [blame] | 5 | * Authors: Jérôme Glisse <[email protected]> |
Jérôme Glisse | 133ff0e | 2017-09-08 16:11:23 -0700 | [diff] [blame] | 6 | * |
Jason Gunthorpe | f970b97 | 2020-03-27 17:00:15 -0300 | [diff] [blame] | 7 | * See Documentation/vm/hmm.rst for reasons and overview of what HMM is. |
Jérôme Glisse | 133ff0e | 2017-09-08 16:11:23 -0700 | [diff] [blame] | 8 | */ |
| 9 | #ifndef LINUX_HMM_H |
| 10 | #define LINUX_HMM_H |
| 11 | |
| 12 | #include <linux/kconfig.h> |
Mike Rapoport | ca5999f | 2020-06-08 21:32:38 -0700 | [diff] [blame] | 13 | #include <linux/pgtable.h> |
Jérôme Glisse | 133ff0e | 2017-09-08 16:11:23 -0700 | [diff] [blame] | 14 | |
Jérôme Glisse | 858b54d | 2017-09-08 16:12:02 -0700 | [diff] [blame] | 15 | #include <linux/device.h> |
Jérôme Glisse | 4ef589d | 2017-09-08 16:11:58 -0700 | [diff] [blame] | 16 | #include <linux/migrate.h> |
| 17 | #include <linux/memremap.h> |
| 18 | #include <linux/completion.h> |
Jérôme Glisse | a3e0d41 | 2019-05-13 17:20:01 -0700 | [diff] [blame] | 19 | #include <linux/mmu_notifier.h> |
Jérôme Glisse | 4ef589d | 2017-09-08 16:11:58 -0700 | [diff] [blame] | 20 | |
Jérôme Glisse | 133ff0e | 2017-09-08 16:11:23 -0700 | [diff] [blame] | 21 | /* |
Jason Gunthorpe | 2733ea1 | 2020-05-01 15:20:48 -0300 | [diff] [blame] | 22 | * On output: |
| 23 | * 0 - The page is faultable and a future call with |
| 24 | * HMM_PFN_REQ_FAULT could succeed. |
| 25 | * HMM_PFN_VALID - the pfn field points to a valid PFN. This PFN is at |
| 26 | * least readable. If dev_private_owner is !NULL then this could |
| 27 | * point at a DEVICE_PRIVATE page. |
| 28 | * HMM_PFN_WRITE - if the page memory can be written to (requires HMM_PFN_VALID) |
| 29 | * HMM_PFN_ERROR - accessing the pfn is impossible and the device should |
| 30 | * fail, e.g. poisoned memory, special pages, no vma, etc. |
Jérôme Glisse | f88a1e9 | 2018-04-10 16:29:06 -0700 | [diff] [blame] | 31 | * |
Jason Gunthorpe | 2733ea1 | 2020-05-01 15:20:48 -0300 | [diff] [blame] | 32 | * On input: |
| 33 | * 0 - Return the current state of the page, do not fault it. |
| 34 | * HMM_PFN_REQ_FAULT - The output must have HMM_PFN_VALID or hmm_range_fault() |
| 35 | * will fail |
| 36 | * HMM_PFN_REQ_WRITE - The output must have HMM_PFN_WRITE or hmm_range_fault() |
| 37 | * will fail. Must be combined with HMM_PFN_REQ_FAULT. |
Jérôme Glisse | f88a1e9 | 2018-04-10 16:29:06 -0700 | [diff] [blame] | 38 | */ |
Jason Gunthorpe | 2733ea1 | 2020-05-01 15:20:48 -0300 | [diff] [blame] | 39 | enum hmm_pfn_flags { |
Ralph Campbell | 3b50a6e | 2020-07-01 15:53:49 -0700 | [diff] [blame] | 40 | /* Output fields and flags */ |
Jason Gunthorpe | 2733ea1 | 2020-05-01 15:20:48 -0300 | [diff] [blame] | 41 | HMM_PFN_VALID = 1UL << (BITS_PER_LONG - 1), |
| 42 | HMM_PFN_WRITE = 1UL << (BITS_PER_LONG - 2), |
| 43 | HMM_PFN_ERROR = 1UL << (BITS_PER_LONG - 3), |
Ralph Campbell | 3b50a6e | 2020-07-01 15:53:49 -0700 | [diff] [blame] | 44 | HMM_PFN_ORDER_SHIFT = (BITS_PER_LONG - 8), |
Jason Gunthorpe | 2733ea1 | 2020-05-01 15:20:48 -0300 | [diff] [blame] | 45 | |
| 46 | /* Input flags */ |
| 47 | HMM_PFN_REQ_FAULT = HMM_PFN_VALID, |
| 48 | HMM_PFN_REQ_WRITE = HMM_PFN_WRITE, |
| 49 | |
Ralph Campbell | 3b50a6e | 2020-07-01 15:53:49 -0700 | [diff] [blame] | 50 | HMM_PFN_FLAGS = 0xFFUL << HMM_PFN_ORDER_SHIFT, |
Jérôme Glisse | f88a1e9 | 2018-04-10 16:29:06 -0700 | [diff] [blame] | 51 | }; |
| 52 | |
| 53 | /* |
Jason Gunthorpe | 2733ea1 | 2020-05-01 15:20:48 -0300 | [diff] [blame] | 54 | * hmm_pfn_to_page() - return struct page pointed to by a device entry |
Jérôme Glisse | f88a1e9 | 2018-04-10 16:29:06 -0700 | [diff] [blame] | 55 | * |
Jason Gunthorpe | 2733ea1 | 2020-05-01 15:20:48 -0300 | [diff] [blame] | 56 | * This must be called under the caller 'user_lock' after a successful |
| 57 | * mmu_interval_read_begin(). The caller must have tested for HMM_PFN_VALID |
| 58 | * already. |
Jérôme Glisse | 133ff0e | 2017-09-08 16:11:23 -0700 | [diff] [blame] | 59 | */ |
Jason Gunthorpe | 2733ea1 | 2020-05-01 15:20:48 -0300 | [diff] [blame] | 60 | static inline struct page *hmm_pfn_to_page(unsigned long hmm_pfn) |
| 61 | { |
| 62 | return pfn_to_page(hmm_pfn & ~HMM_PFN_FLAGS); |
| 63 | } |
Jérôme Glisse | f88a1e9 | 2018-04-10 16:29:06 -0700 | [diff] [blame] | 64 | |
| 65 | /* |
Ralph Campbell | 3b50a6e | 2020-07-01 15:53:49 -0700 | [diff] [blame] | 66 | * hmm_pfn_to_map_order() - return the CPU mapping size order |
| 67 | * |
| 68 | * This is optionally useful to optimize processing of the pfn result |
| 69 | * array. It indicates that the page starts at the order aligned VA and is |
| 70 | * 1<<order bytes long. Every pfn within an high order page will have the |
| 71 | * same pfn flags, both access protections and the map_order. The caller must |
| 72 | * be careful with edge cases as the start and end VA of the given page may |
| 73 | * extend past the range used with hmm_range_fault(). |
| 74 | * |
| 75 | * This must be called under the caller 'user_lock' after a successful |
| 76 | * mmu_interval_read_begin(). The caller must have tested for HMM_PFN_VALID |
| 77 | * already. |
| 78 | */ |
| 79 | static inline unsigned int hmm_pfn_to_map_order(unsigned long hmm_pfn) |
| 80 | { |
| 81 | return (hmm_pfn >> HMM_PFN_ORDER_SHIFT) & 0x1F; |
| 82 | } |
| 83 | |
/*
 * struct hmm_range - track invalidation lock on virtual address range
 *
 * Each member is described next to its declaration.
 */
struct hmm_range {
	/* a mmu_interval_notifier that includes the start/end */
	struct mmu_interval_notifier *notifier;
	/* result of mmu_interval_read_begin() */
	unsigned long		notifier_seq;
	/* range virtual start address (inclusive) */
	unsigned long		start;
	/* range virtual end address (exclusive) */
	unsigned long		end;
	/* array of pfns (big enough for the range) */
	unsigned long		*hmm_pfns;
	/* default flags for the range (write, read, ... see hmm doc) */
	unsigned long		default_flags;
	/* allows to mask pfn flags so that only default_flags matter */
	unsigned long		pfn_flags_mask;
	/* owner of device private pages */
	void			*dev_private_owner;
};
Jérôme Glisse | 133ff0e | 2017-09-08 16:11:23 -0700 | [diff] [blame] | 106 | |
/*
 * hmm_range_fault() - operate on the range described by a struct hmm_range
 *
 * @range: the range to process, see struct hmm_range
 *
 * Please see Documentation/vm/hmm.rst for how to use the range API.
 *
 * As described for enum hmm_pfn_flags, the call fails when an entry requested
 * with HMM_PFN_REQ_FAULT cannot be output with HMM_PFN_VALID, or an entry
 * requested with HMM_PFN_REQ_WRITE cannot be output with HMM_PFN_WRITE.
 *
 * NOTE(review): the return convention is not visible in this header;
 * presumably 0 on success and a negative errno on failure - confirm against
 * the implementation.
 */
int hmm_range_fault(struct hmm_range *range);
Jérôme Glisse | 74eee18 | 2017-09-08 16:11:35 -0700 | [diff] [blame] | 111 | |
/*
 * HMM_RANGE_DEFAULT_TIMEOUT - default timeout (ms) when waiting for a range
 *
 * When waiting for mmu notifiers we need some kind of timeout, otherwise we
 * could potentially wait forever. 1000 ms, i.e. 1 s, already sounds like a
 * long time to wait.
 */
#define HMM_RANGE_DEFAULT_TIMEOUT 1000
| 120 | |
Jérôme Glisse | 133ff0e | 2017-09-08 16:11:23 -0700 | [diff] [blame] | 121 | #endif /* LINUX_HMM_H */ |