1 // SPDX-License-Identifier: GPL-2.0-only
3 * Support KVM gust page tracking
5 * This feature allows us to track page access in guest. Currently, only
6 * write access is tracked.
8 * Copyright(C) 2015 Intel Corporation.
11 * Xiao Guangrong <guangrong.xiao@linux.intel.com>
13 #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
15 #include <linux/lockdep.h>
16 #include <linux/kvm_host.h>
17 #include <linux/rculist.h>
20 #include "mmu_internal.h"
21 #include "page_track.h"
23 bool kvm_page_track_write_tracking_enabled(struct kvm *kvm)
25 return IS_ENABLED(CONFIG_KVM_EXTERNAL_WRITE_TRACKING) ||
26 !tdp_enabled || kvm_shadow_root_allocated(kvm);
29 void kvm_page_track_free_memslot(struct kvm_memory_slot *slot)
31 kvfree(slot->arch.gfn_write_track);
32 slot->arch.gfn_write_track = NULL;
35 static int __kvm_page_track_write_tracking_alloc(struct kvm_memory_slot *slot,
38 const size_t size = sizeof(*slot->arch.gfn_write_track);
40 if (!slot->arch.gfn_write_track)
41 slot->arch.gfn_write_track = __vcalloc(npages, size,
44 return slot->arch.gfn_write_track ? 0 : -ENOMEM;
47 int kvm_page_track_create_memslot(struct kvm *kvm,
48 struct kvm_memory_slot *slot,
51 if (!kvm_page_track_write_tracking_enabled(kvm))
54 return __kvm_page_track_write_tracking_alloc(slot, npages);
57 int kvm_page_track_write_tracking_alloc(struct kvm_memory_slot *slot)
59 return __kvm_page_track_write_tracking_alloc(slot, slot->npages);
62 static void update_gfn_write_track(struct kvm_memory_slot *slot, gfn_t gfn,
67 index = gfn_to_index(gfn, slot->base_gfn, PG_LEVEL_4K);
69 val = slot->arch.gfn_write_track[index];
71 if (WARN_ON_ONCE(val + count < 0 || val + count > USHRT_MAX))
74 slot->arch.gfn_write_track[index] += count;
77 void __kvm_write_track_add_gfn(struct kvm *kvm, struct kvm_memory_slot *slot,
80 lockdep_assert_held_write(&kvm->mmu_lock);
82 lockdep_assert_once(lockdep_is_held(&kvm->slots_lock) ||
83 srcu_read_lock_held(&kvm->srcu));
85 if (KVM_BUG_ON(!kvm_page_track_write_tracking_enabled(kvm), kvm))
88 update_gfn_write_track(slot, gfn, 1);
91 * new track stops large page mapping for the
94 kvm_mmu_gfn_disallow_lpage(slot, gfn);
96 if (kvm_mmu_slot_gfn_write_protect(kvm, slot, gfn, PG_LEVEL_4K))
97 kvm_flush_remote_tlbs(kvm);
100 void __kvm_write_track_remove_gfn(struct kvm *kvm,
101 struct kvm_memory_slot *slot, gfn_t gfn)
103 lockdep_assert_held_write(&kvm->mmu_lock);
105 lockdep_assert_once(lockdep_is_held(&kvm->slots_lock) ||
106 srcu_read_lock_held(&kvm->srcu));
108 if (KVM_BUG_ON(!kvm_page_track_write_tracking_enabled(kvm), kvm))
111 update_gfn_write_track(slot, gfn, -1);
114 * allow large page mapping for the tracked page
115 * after the tracker is gone.
117 kvm_mmu_gfn_allow_lpage(slot, gfn);
121 * check if the corresponding access on the specified guest page is tracked.
123 bool kvm_gfn_is_write_tracked(struct kvm *kvm,
124 const struct kvm_memory_slot *slot, gfn_t gfn)
131 if (!kvm_page_track_write_tracking_enabled(kvm))
134 index = gfn_to_index(gfn, slot->base_gfn, PG_LEVEL_4K);
135 return !!READ_ONCE(slot->arch.gfn_write_track[index]);
138 #ifdef CONFIG_KVM_EXTERNAL_WRITE_TRACKING
139 void kvm_page_track_cleanup(struct kvm *kvm)
141 struct kvm_page_track_notifier_head *head;
143 head = &kvm->arch.track_notifier_head;
144 cleanup_srcu_struct(&head->track_srcu);
147 int kvm_page_track_init(struct kvm *kvm)
149 struct kvm_page_track_notifier_head *head;
151 head = &kvm->arch.track_notifier_head;
152 INIT_HLIST_HEAD(&head->track_notifier_list);
153 return init_srcu_struct(&head->track_srcu);
157 * register the notifier so that event interception for the tracked guest
158 * pages can be received.
160 int kvm_page_track_register_notifier(struct kvm *kvm,
161 struct kvm_page_track_notifier_node *n)
163 struct kvm_page_track_notifier_head *head;
165 if (!kvm || kvm->mm != current->mm)
170 head = &kvm->arch.track_notifier_head;
172 write_lock(&kvm->mmu_lock);
173 hlist_add_head_rcu(&n->node, &head->track_notifier_list);
174 write_unlock(&kvm->mmu_lock);
177 EXPORT_SYMBOL_GPL(kvm_page_track_register_notifier);
180 * stop receiving the event interception. It is the opposed operation of
181 * kvm_page_track_register_notifier().
183 void kvm_page_track_unregister_notifier(struct kvm *kvm,
184 struct kvm_page_track_notifier_node *n)
186 struct kvm_page_track_notifier_head *head;
188 head = &kvm->arch.track_notifier_head;
190 write_lock(&kvm->mmu_lock);
191 hlist_del_rcu(&n->node);
192 write_unlock(&kvm->mmu_lock);
193 synchronize_srcu(&head->track_srcu);
197 EXPORT_SYMBOL_GPL(kvm_page_track_unregister_notifier);
200 * Notify the node that write access is intercepted and write emulation is
201 * finished at this time.
203 * The node should figure out if the written page is the one that node is
204 * interested in by itself.
206 void __kvm_page_track_write(struct kvm *kvm, gpa_t gpa, const u8 *new, int bytes)
208 struct kvm_page_track_notifier_head *head;
209 struct kvm_page_track_notifier_node *n;
212 head = &kvm->arch.track_notifier_head;
214 if (hlist_empty(&head->track_notifier_list))
217 idx = srcu_read_lock(&head->track_srcu);
218 hlist_for_each_entry_srcu(n, &head->track_notifier_list, node,
219 srcu_read_lock_held(&head->track_srcu))
221 n->track_write(gpa, new, bytes, n);
222 srcu_read_unlock(&head->track_srcu, idx);
226 * Notify external page track nodes that a memory region is being removed from
227 * the VM, e.g. so that users can free any associated metadata.
229 void kvm_page_track_delete_slot(struct kvm *kvm, struct kvm_memory_slot *slot)
231 struct kvm_page_track_notifier_head *head;
232 struct kvm_page_track_notifier_node *n;
235 head = &kvm->arch.track_notifier_head;
237 if (hlist_empty(&head->track_notifier_list))
240 idx = srcu_read_lock(&head->track_srcu);
241 hlist_for_each_entry_srcu(n, &head->track_notifier_list, node,
242 srcu_read_lock_held(&head->track_srcu))
243 if (n->track_remove_region)
244 n->track_remove_region(slot->base_gfn, slot->npages, n);
245 srcu_read_unlock(&head->track_srcu, idx);
249 * add guest page to the tracking pool so that corresponding access on that
250 * page will be intercepted.
252 * @kvm: the guest instance we are interested in.
253 * @gfn: the guest page.
255 int kvm_write_track_add_gfn(struct kvm *kvm, gfn_t gfn)
257 struct kvm_memory_slot *slot;
260 idx = srcu_read_lock(&kvm->srcu);
262 slot = gfn_to_memslot(kvm, gfn);
264 srcu_read_unlock(&kvm->srcu, idx);
268 write_lock(&kvm->mmu_lock);
269 __kvm_write_track_add_gfn(kvm, slot, gfn);
270 write_unlock(&kvm->mmu_lock);
272 srcu_read_unlock(&kvm->srcu, idx);
276 EXPORT_SYMBOL_GPL(kvm_write_track_add_gfn);
279 * remove the guest page from the tracking pool which stops the interception
280 * of corresponding access on that page.
282 * @kvm: the guest instance we are interested in.
283 * @gfn: the guest page.
285 int kvm_write_track_remove_gfn(struct kvm *kvm, gfn_t gfn)
287 struct kvm_memory_slot *slot;
290 idx = srcu_read_lock(&kvm->srcu);
292 slot = gfn_to_memslot(kvm, gfn);
294 srcu_read_unlock(&kvm->srcu, idx);
298 write_lock(&kvm->mmu_lock);
299 __kvm_write_track_remove_gfn(kvm, slot, gfn);
300 write_unlock(&kvm->mmu_lock);
302 srcu_read_unlock(&kvm->srcu, idx);
306 EXPORT_SYMBOL_GPL(kvm_write_track_remove_gfn);