xref: /OK3568_Linux_fs/kernel/arch/x86/kvm/mmu/page_track.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
// SPDX-License-Identifier: GPL-2.0-only
/*
 * Support KVM guest page tracking
 *
 * This feature allows us to track page access in the guest. Currently,
 * only write access is tracked.
 *
 * Copyright(C) 2015 Intel Corporation.
 *
 * Author:
 *   Xiao Guangrong <guangrong.xiao@linux.intel.com>
 */

#include <linux/kvm_host.h>
#include <linux/rculist.h>

#include <asm/kvm_page_track.h>

#include "mmu_internal.h"

void kvm_page_track_free_memslot(struct kvm_memory_slot *slot)
{
	int i;

	for (i = 0; i < KVM_PAGE_TRACK_MAX; i++) {
		kvfree(slot->arch.gfn_track[i]);
		slot->arch.gfn_track[i] = NULL;
	}
}

int kvm_page_track_create_memslot(struct kvm_memory_slot *slot,
				  unsigned long npages)
{
	int i;

	for (i = 0; i < KVM_PAGE_TRACK_MAX; i++) {
		slot->arch.gfn_track[i] =
			kvcalloc(npages, sizeof(*slot->arch.gfn_track[i]),
				 GFP_KERNEL_ACCOUNT);
		if (!slot->arch.gfn_track[i])
			goto track_free;
	}

	return 0;

track_free:
	kvm_page_track_free_memslot(slot);
	return -ENOMEM;
}

static inline bool page_track_mode_is_valid(enum kvm_page_track_mode mode)
{
	if (mode < 0 || mode >= KVM_PAGE_TRACK_MAX)
		return false;

	return true;
}

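/*
 * Adjust the tracker count for @gfn in @mode by @count. Each 4K page in a
 * memslot has a per-mode short counter; a non-zero counter means at least
 * one tracker wants accesses to that page intercepted.
 */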
static void update_gfn_track(struct kvm_memory_slot *slot, gfn_t gfn,
			     enum kvm_page_track_mode mode, short count)
{
	int index, val;

	index = gfn_to_index(gfn, slot->base_gfn, PG_LEVEL_4K);

	val = slot->arch.gfn_track[mode][index];

	if (WARN_ON(val + count < 0 || val + count > USHRT_MAX))
		return;

	slot->arch.gfn_track[mode][index] += count;
}

/*
 * Add a guest page to the tracking pool so that the corresponding access
 * to that page will be intercepted.
 *
 * It should be called under the protection of mmu-lock, and of either
 * kvm->srcu or kvm->slots_lock.
 *
 * @kvm: the guest instance we are interested in.
 * @slot: the memory slot that @gfn belongs to.
 * @gfn: the guest page.
 * @mode: tracking mode, currently only write tracking is supported.
 */
void kvm_slot_page_track_add_page(struct kvm *kvm,
				  struct kvm_memory_slot *slot, gfn_t gfn,
				  enum kvm_page_track_mode mode)
{
	if (WARN_ON(!page_track_mode_is_valid(mode)))
		return;

	update_gfn_track(slot, gfn, mode, 1);

	/*
	 * A new tracker stops large-page mapping for the
	 * tracked page.
	 */
	kvm_mmu_gfn_disallow_lpage(slot, gfn);

	if (mode == KVM_PAGE_TRACK_WRITE)
		if (kvm_mmu_slot_gfn_write_protect(kvm, slot, gfn))
			kvm_flush_remote_tlbs(kvm);
}
EXPORT_SYMBOL_GPL(kvm_slot_page_track_add_page);
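
/*
 * Illustrative sketch, not part of the original file: how an external
 * tracker such as KVMGT might write-track a single guest page. The helper
 * name is hypothetical; the locking follows the rule documented above
 * (mmu-lock plus kvm->srcu or kvm->slots_lock; mmu_lock is a spinlock in
 * this kernel version).
 */
static void __maybe_unused example_write_track_gfn(struct kvm *kvm, gfn_t gfn)
{
	struct kvm_memory_slot *slot;
	int idx;

	idx = srcu_read_lock(&kvm->srcu);	/* keeps the memslot stable */
	slot = gfn_to_memslot(kvm, gfn);
	if (slot) {
		spin_lock(&kvm->mmu_lock);
		kvm_slot_page_track_add_page(kvm, slot, gfn,
					     KVM_PAGE_TRACK_WRITE);
		spin_unlock(&kvm->mmu_lock);
	}
	srcu_read_unlock(&kvm->srcu, idx);
}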

/*
 * Remove the guest page from the tracking pool, which stops the
 * interception of the corresponding access to that page. It is the
 * opposite operation of kvm_slot_page_track_add_page().
 *
 * It should be called under the protection of mmu-lock, and of either
 * kvm->srcu or kvm->slots_lock.
 *
 * @kvm: the guest instance we are interested in.
 * @slot: the memory slot that @gfn belongs to.
 * @gfn: the guest page.
 * @mode: tracking mode, currently only write tracking is supported.
 */
void kvm_slot_page_track_remove_page(struct kvm *kvm,
				     struct kvm_memory_slot *slot, gfn_t gfn,
				     enum kvm_page_track_mode mode)
{
	if (WARN_ON(!page_track_mode_is_valid(mode)))
		return;

	update_gfn_track(slot, gfn, mode, -1);

	/*
	 * Allow large-page mapping for the tracked page
	 * after the tracker is gone.
	 */
	kvm_mmu_gfn_allow_lpage(slot, gfn);
}
EXPORT_SYMBOL_GPL(kvm_slot_page_track_remove_page);
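
/*
 * Illustrative sketch, not part of the original file: the removal path
 * mirrors the add sketch above, under the same locking; the helper name is
 * hypothetical.
 */
static void __maybe_unused example_write_untrack_gfn(struct kvm *kvm, gfn_t gfn)
{
	struct kvm_memory_slot *slot;
	int idx;

	idx = srcu_read_lock(&kvm->srcu);
	slot = gfn_to_memslot(kvm, gfn);
	if (slot) {
		spin_lock(&kvm->mmu_lock);
		kvm_slot_page_track_remove_page(kvm, slot, gfn,
						KVM_PAGE_TRACK_WRITE);
		spin_unlock(&kvm->mmu_lock);
	}
	srcu_read_unlock(&kvm->srcu, idx);
}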

/*
 * Check whether the corresponding access to the specified guest page is
 * tracked.
 */
bool kvm_page_track_is_active(struct kvm_vcpu *vcpu, gfn_t gfn,
			      enum kvm_page_track_mode mode)
{
	struct kvm_memory_slot *slot;
	int index;

	if (WARN_ON(!page_track_mode_is_valid(mode)))
		return false;

	slot = kvm_vcpu_gfn_to_memslot(vcpu, gfn);
	if (!slot)
		return false;

	index = gfn_to_index(gfn, slot->base_gfn, PG_LEVEL_4K);
	return !!READ_ONCE(slot->arch.gfn_track[mode][index]);
}
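
/*
 * Illustrative sketch, not part of the original file: a page-fault path can
 * use kvm_page_track_is_active() to decide whether a write fault must be
 * emulated instead of fixed up. The helper below is hypothetical.
 */
static bool __maybe_unused example_fault_is_write_tracked(struct kvm_vcpu *vcpu,
							  gfn_t gfn)
{
	/* A non-zero tracker count means the write must be intercepted. */
	return kvm_page_track_is_active(vcpu, gfn, KVM_PAGE_TRACK_WRITE);
}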

void kvm_page_track_cleanup(struct kvm *kvm)
{
	struct kvm_page_track_notifier_head *head;

	head = &kvm->arch.track_notifier_head;
	cleanup_srcu_struct(&head->track_srcu);
}

int kvm_page_track_init(struct kvm *kvm)
{
	struct kvm_page_track_notifier_head *head;

	head = &kvm->arch.track_notifier_head;
	INIT_HLIST_HEAD(&head->track_notifier_list);
	return init_srcu_struct(&head->track_srcu);
}

/*
 * Register the notifier so that events for the tracked guest pages can be
 * received.
 */
void
kvm_page_track_register_notifier(struct kvm *kvm,
				 struct kvm_page_track_notifier_node *n)
{
	struct kvm_page_track_notifier_head *head;

	head = &kvm->arch.track_notifier_head;

	spin_lock(&kvm->mmu_lock);
	hlist_add_head_rcu(&n->node, &head->track_notifier_list);
	spin_unlock(&kvm->mmu_lock);
}
EXPORT_SYMBOL_GPL(kvm_page_track_register_notifier);

/*
 * Stop receiving events for tracked guest pages. It is the opposite
 * operation of kvm_page_track_register_notifier().
 */
void
kvm_page_track_unregister_notifier(struct kvm *kvm,
				   struct kvm_page_track_notifier_node *n)
{
	struct kvm_page_track_notifier_head *head;

	head = &kvm->arch.track_notifier_head;

	spin_lock(&kvm->mmu_lock);
	hlist_del_rcu(&n->node);
	spin_unlock(&kvm->mmu_lock);
	synchronize_srcu(&head->track_srcu);
}
EXPORT_SYMBOL_GPL(kvm_page_track_unregister_notifier);
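
/*
 * Illustrative sketch, not part of the original file: a minimal notifier
 * user. The callback bodies and the init/exit helpers are hypothetical;
 * the node fields (track_write, track_flush_slot) and their signatures
 * come from <asm/kvm_page_track.h> and match the call sites below.
 */
static void example_track_write(struct kvm_vcpu *vcpu, gpa_t gpa,
				const u8 *new, int bytes,
				struct kvm_page_track_notifier_node *node)
{
	/* Called after a tracked page was written and emulation finished. */
}

static void example_track_flush_slot(struct kvm *kvm,
				     struct kvm_memory_slot *slot,
				     struct kvm_page_track_notifier_node *node)
{
	/* Drop any tracking state held for pages in @slot. */
}

static struct kvm_page_track_notifier_node example_node = {
	.track_write		= example_track_write,
	.track_flush_slot	= example_track_flush_slot,
};

static void __maybe_unused example_tracker_init(struct kvm *kvm)
{
	kvm_page_track_register_notifier(kvm, &example_node);
}

static void __maybe_unused example_tracker_exit(struct kvm *kvm)
{
	kvm_page_track_unregister_notifier(kvm, &example_node);
}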

/*
 * Notify the nodes that write access was intercepted and write emulation
 * has finished at this time.
 *
 * Each node must figure out for itself whether the written page is one it
 * is interested in.
 */
void kvm_page_track_write(struct kvm_vcpu *vcpu, gpa_t gpa, const u8 *new,
			  int bytes)
{
	struct kvm_page_track_notifier_head *head;
	struct kvm_page_track_notifier_node *n;
	int idx;

	head = &vcpu->kvm->arch.track_notifier_head;

	if (hlist_empty(&head->track_notifier_list))
		return;

	idx = srcu_read_lock(&head->track_srcu);
	hlist_for_each_entry_srcu(n, &head->track_notifier_list, node,
				srcu_read_lock_held(&head->track_srcu))
		if (n->track_write)
			n->track_write(vcpu, gpa, new, bytes, n);
	srcu_read_unlock(&head->track_srcu, idx);
}

/*
 * Notify the nodes that a memory slot is being removed or moved so that
 * they can drop write-protection for the pages in that memory slot.
 *
 * Each node must figure out for itself whether it has any write-protected
 * pages in this slot.
 */
void kvm_page_track_flush_slot(struct kvm *kvm, struct kvm_memory_slot *slot)
{
	struct kvm_page_track_notifier_head *head;
	struct kvm_page_track_notifier_node *n;
	int idx;

	head = &kvm->arch.track_notifier_head;

	if (hlist_empty(&head->track_notifier_list))
		return;

	idx = srcu_read_lock(&head->track_srcu);
	hlist_for_each_entry_srcu(n, &head->track_notifier_list, node,
				srcu_read_lock_held(&head->track_srcu))
		if (n->track_flush_slot)
			n->track_flush_slot(kvm, slot, n);
	srcu_read_unlock(&head->track_srcu, idx);
}