Skip to content

Commit 338068b

Browse files
sean-jcbonzini
authored andcommitted
KVM: x86/mmu: Drop infrastructure for multiple page-track modes
Drop "support" for multiple page-track modes, as there is no evidence that array-based and refcounted metadata is the optimal solution for other modes, nor is there any evidence that other use cases, e.g. for access-tracking, will be a good fit for the page-track machinery in general. E.g. one potential use case of access-tracking would be to prevent guest access to poisoned memory (from the guest's perspective). In that case, the number of poisoned pages is likely to be a very small percentage of the guest memory, and there is no need to reference count the number of access-tracking users, i.e. expanding gfn_track[] for a new mode would be grossly inefficient. And for poisoned memory, host userspace would also likely want to trap accesses, e.g. to inject #MC into the guest, and that isn't currently supported by the page-track framework. A better alternative for that poisoned page use case is likely a variation of the proposed per-gfn attributes overlay (linked), which would allow efficiently tracking the sparse set of poisoned pages, and by default would exit to userspace on access. Link: https://lore.kernel.org/all/Y2WB48kD0J4VGynX@google.com Cc: Ben Gardon <bgardon@google.com> Tested-by: Yongwei Ma <yongwei.ma@intel.com> Link: https://lore.kernel.org/r/20230729013535.1070024-24-seanjc@google.com Signed-off-by: Sean Christopherson <seanjc@google.com> Signed-off-by: Paolo Bonzini <pbonzini@redhat.com>
1 parent e998fb1 commit 338068b

File tree

6 files changed

+48
-102
lines changed

6 files changed

+48
-102
lines changed

arch/x86/include/asm/kvm_host.h

Lines changed: 6 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -288,13 +288,13 @@ struct kvm_kernel_irq_routing_entry;
288288
* kvm_mmu_page_role tracks the properties of a shadow page (where shadow page
289289
* also includes TDP pages) to determine whether or not a page can be used in
290290
* the given MMU context. This is a subset of the overall kvm_cpu_role to
291-
* minimize the size of kvm_memory_slot.arch.gfn_track, i.e. allows allocating
292-
* 2 bytes per gfn instead of 4 bytes per gfn.
291+
* minimize the size of kvm_memory_slot.arch.gfn_write_track, i.e. allows
292+
* allocating 2 bytes per gfn instead of 4 bytes per gfn.
293293
*
294294
* Upper-level shadow pages having gptes are tracked for write-protection via
295-
* gfn_track. As above, gfn_track is a 16 bit counter, so KVM must not create
296-
* more than 2^16-1 upper-level shadow pages at a single gfn, otherwise
297-
* gfn_track will overflow and explosions will ensure.
295+
* gfn_write_track. As above, gfn_write_track is a 16 bit counter, so KVM must
296+
* not create more than 2^16-1 upper-level shadow pages at a single gfn,
297+
* otherwise gfn_write_track will overflow and explosions will ensue.
298298
*
299299
* A unique shadow page (SP) for a gfn is created if and only if an existing SP
300300
* cannot be reused. The ability to reuse a SP is tracked by its role, which
@@ -1023,7 +1023,7 @@ struct kvm_lpage_info {
10231023
struct kvm_arch_memory_slot {
10241024
struct kvm_rmap_head *rmap[KVM_NR_PAGE_SIZES];
10251025
struct kvm_lpage_info *lpage_info[KVM_NR_PAGE_SIZES - 1];
1026-
unsigned short *gfn_track[KVM_PAGE_TRACK_MAX];
1026+
unsigned short *gfn_write_track;
10271027
};
10281028

10291029
/*

arch/x86/include/asm/kvm_page_track.h

Lines changed: 2 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -4,17 +4,10 @@
44

55
#include <linux/kvm_types.h>
66

7-
enum kvm_page_track_mode {
8-
KVM_PAGE_TRACK_WRITE,
9-
KVM_PAGE_TRACK_MAX,
10-
};
11-
127
void kvm_slot_page_track_add_page(struct kvm *kvm,
13-
struct kvm_memory_slot *slot, gfn_t gfn,
14-
enum kvm_page_track_mode mode);
8+
struct kvm_memory_slot *slot, gfn_t gfn);
159
void kvm_slot_page_track_remove_page(struct kvm *kvm,
16-
struct kvm_memory_slot *slot, gfn_t gfn,
17-
enum kvm_page_track_mode mode);
10+
struct kvm_memory_slot *slot, gfn_t gfn);
1811

1912
#ifdef CONFIG_KVM_EXTERNAL_WRITE_TRACKING
2013
/*

arch/x86/kvm/mmu/mmu.c

Lines changed: 6 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -831,8 +831,7 @@ static void account_shadowed(struct kvm *kvm, struct kvm_mmu_page *sp)
831831

832832
/* the non-leaf shadow pages are keeping readonly. */
833833
if (sp->role.level > PG_LEVEL_4K)
834-
return kvm_slot_page_track_add_page(kvm, slot, gfn,
835-
KVM_PAGE_TRACK_WRITE);
834+
return kvm_slot_page_track_add_page(kvm, slot, gfn);
836835

837836
kvm_mmu_gfn_disallow_lpage(slot, gfn);
838837

@@ -878,8 +877,7 @@ static void unaccount_shadowed(struct kvm *kvm, struct kvm_mmu_page *sp)
878877
slots = kvm_memslots_for_spte_role(kvm, sp->role);
879878
slot = __gfn_to_memslot(slots, gfn);
880879
if (sp->role.level > PG_LEVEL_4K)
881-
return kvm_slot_page_track_remove_page(kvm, slot, gfn,
882-
KVM_PAGE_TRACK_WRITE);
880+
return kvm_slot_page_track_remove_page(kvm, slot, gfn);
883881

884882
kvm_mmu_gfn_allow_lpage(slot, gfn);
885883
}
@@ -2809,7 +2807,7 @@ int mmu_try_to_unsync_pages(struct kvm *kvm, const struct kvm_memory_slot *slot,
28092807
* track machinery is used to write-protect upper-level shadow pages,
28102808
* i.e. this guards the role.level == 4K assertion below!
28112809
*/
2812-
if (kvm_slot_page_track_is_active(kvm, slot, gfn, KVM_PAGE_TRACK_WRITE))
2810+
if (kvm_slot_page_track_is_active(kvm, slot, gfn))
28132811
return -EPERM;
28142812

28152813
/*
@@ -4203,7 +4201,7 @@ static bool page_fault_handle_page_track(struct kvm_vcpu *vcpu,
42034201
* guest is writing the page which is write tracked which can
42044202
* not be fixed by page fault handler.
42054203
*/
4206-
if (kvm_slot_page_track_is_active(vcpu->kvm, fault->slot, fault->gfn, KVM_PAGE_TRACK_WRITE))
4204+
if (kvm_slot_page_track_is_active(vcpu->kvm, fault->slot, fault->gfn))
42074205
return true;
42084206

42094207
return false;
@@ -5422,8 +5420,8 @@ void kvm_mmu_after_set_cpuid(struct kvm_vcpu *vcpu)
54225420
* physical address properties) in a single VM would require tracking
54235421
* all relevant CPUID information in kvm_mmu_page_role. That is very
54245422
* undesirable as it would increase the memory requirements for
5425-
* gfn_track (see struct kvm_mmu_page_role comments). For now that
5426-
* problem is swept under the rug; KVM's CPUID API is horrific and
5423+
* gfn_write_track (see struct kvm_mmu_page_role comments). For now
5424+
* that problem is swept under the rug; KVM's CPUID API is horrific and
54275425
* it's all but impossible to solve it without introducing a new API.
54285426
*/
54295427
vcpu->arch.root_mmu.root_role.word = 0;

arch/x86/kvm/mmu/page_track.c

Lines changed: 31 additions & 75 deletions
Original file line numberDiff line numberDiff line change
@@ -27,76 +27,50 @@ bool kvm_page_track_write_tracking_enabled(struct kvm *kvm)
2727

2828
void kvm_page_track_free_memslot(struct kvm_memory_slot *slot)
2929
{
30-
int i;
31-
32-
for (i = 0; i < KVM_PAGE_TRACK_MAX; i++) {
33-
kvfree(slot->arch.gfn_track[i]);
34-
slot->arch.gfn_track[i] = NULL;
35-
}
30+
kvfree(slot->arch.gfn_write_track);
31+
slot->arch.gfn_write_track = NULL;
3632
}
3733

38-
int kvm_page_track_create_memslot(struct kvm *kvm,
39-
struct kvm_memory_slot *slot,
40-
unsigned long npages)
34+
static int __kvm_page_track_write_tracking_alloc(struct kvm_memory_slot *slot,
35+
unsigned long npages)
4136
{
42-
int i;
43-
44-
for (i = 0; i < KVM_PAGE_TRACK_MAX; i++) {
45-
if (i == KVM_PAGE_TRACK_WRITE &&
46-
!kvm_page_track_write_tracking_enabled(kvm))
47-
continue;
48-
49-
slot->arch.gfn_track[i] =
50-
__vcalloc(npages, sizeof(*slot->arch.gfn_track[i]),
51-
GFP_KERNEL_ACCOUNT);
52-
if (!slot->arch.gfn_track[i])
53-
goto track_free;
54-
}
37+
const size_t size = sizeof(*slot->arch.gfn_write_track);
5538

56-
return 0;
39+
if (!slot->arch.gfn_write_track)
40+
slot->arch.gfn_write_track = __vcalloc(npages, size,
41+
GFP_KERNEL_ACCOUNT);
5742

58-
track_free:
59-
kvm_page_track_free_memslot(slot);
60-
return -ENOMEM;
43+
return slot->arch.gfn_write_track ? 0 : -ENOMEM;
6144
}
6245

63-
static inline bool page_track_mode_is_valid(enum kvm_page_track_mode mode)
46+
int kvm_page_track_create_memslot(struct kvm *kvm,
47+
struct kvm_memory_slot *slot,
48+
unsigned long npages)
6449
{
65-
if (mode < 0 || mode >= KVM_PAGE_TRACK_MAX)
66-
return false;
50+
if (!kvm_page_track_write_tracking_enabled(kvm))
51+
return 0;
6752

68-
return true;
53+
return __kvm_page_track_write_tracking_alloc(slot, npages);
6954
}
7055

7156
int kvm_page_track_write_tracking_alloc(struct kvm_memory_slot *slot)
7257
{
73-
unsigned short *gfn_track;
74-
75-
if (slot->arch.gfn_track[KVM_PAGE_TRACK_WRITE])
76-
return 0;
77-
78-
gfn_track = __vcalloc(slot->npages, sizeof(*gfn_track),
79-
GFP_KERNEL_ACCOUNT);
80-
if (gfn_track == NULL)
81-
return -ENOMEM;
82-
83-
slot->arch.gfn_track[KVM_PAGE_TRACK_WRITE] = gfn_track;
84-
return 0;
58+
return __kvm_page_track_write_tracking_alloc(slot, slot->npages);
8559
}
8660

87-
static void update_gfn_track(struct kvm_memory_slot *slot, gfn_t gfn,
88-
enum kvm_page_track_mode mode, short count)
61+
static void update_gfn_write_track(struct kvm_memory_slot *slot, gfn_t gfn,
62+
short count)
8963
{
9064
int index, val;
9165

9266
index = gfn_to_index(gfn, slot->base_gfn, PG_LEVEL_4K);
9367

94-
val = slot->arch.gfn_track[mode][index];
68+
val = slot->arch.gfn_write_track[index];
9569

9670
if (WARN_ON_ONCE(val + count < 0 || val + count > USHRT_MAX))
9771
return;
9872

99-
slot->arch.gfn_track[mode][index] += count;
73+
slot->arch.gfn_write_track[index] += count;
10074
}
10175

10276
/*
@@ -109,31 +83,23 @@ static void update_gfn_track(struct kvm_memory_slot *slot, gfn_t gfn,
10983
* @kvm: the guest instance we are interested in.
11084
* @slot: the @gfn belongs to.
11185
* @gfn: the guest page.
112-
* @mode: tracking mode, currently only write track is supported.
11386
*/
11487
void kvm_slot_page_track_add_page(struct kvm *kvm,
115-
struct kvm_memory_slot *slot, gfn_t gfn,
116-
enum kvm_page_track_mode mode)
88+
struct kvm_memory_slot *slot, gfn_t gfn)
11789
{
118-
119-
if (WARN_ON_ONCE(!page_track_mode_is_valid(mode)))
90+
if (WARN_ON_ONCE(!kvm_page_track_write_tracking_enabled(kvm)))
12091
return;
12192

122-
if (WARN_ON_ONCE(mode == KVM_PAGE_TRACK_WRITE &&
123-
!kvm_page_track_write_tracking_enabled(kvm)))
124-
return;
125-
126-
update_gfn_track(slot, gfn, mode, 1);
93+
update_gfn_write_track(slot, gfn, 1);
12794

12895
/*
12996
* new track stops large page mapping for the
13097
* tracked page.
13198
*/
13299
kvm_mmu_gfn_disallow_lpage(slot, gfn);
133100

134-
if (mode == KVM_PAGE_TRACK_WRITE)
135-
if (kvm_mmu_slot_gfn_write_protect(kvm, slot, gfn, PG_LEVEL_4K))
136-
kvm_flush_remote_tlbs(kvm);
101+
if (kvm_mmu_slot_gfn_write_protect(kvm, slot, gfn, PG_LEVEL_4K))
102+
kvm_flush_remote_tlbs(kvm);
137103
}
138104
EXPORT_SYMBOL_GPL(kvm_slot_page_track_add_page);
139105

@@ -148,20 +114,14 @@ EXPORT_SYMBOL_GPL(kvm_slot_page_track_add_page);
148114
* @kvm: the guest instance we are interested in.
149115
* @slot: the @gfn belongs to.
150116
* @gfn: the guest page.
151-
* @mode: tracking mode, currently only write track is supported.
152117
*/
153118
void kvm_slot_page_track_remove_page(struct kvm *kvm,
154-
struct kvm_memory_slot *slot, gfn_t gfn,
155-
enum kvm_page_track_mode mode)
119+
struct kvm_memory_slot *slot, gfn_t gfn)
156120
{
157-
if (WARN_ON_ONCE(!page_track_mode_is_valid(mode)))
158-
return;
159-
160-
if (WARN_ON_ONCE(mode == KVM_PAGE_TRACK_WRITE &&
161-
!kvm_page_track_write_tracking_enabled(kvm)))
121+
if (WARN_ON_ONCE(!kvm_page_track_write_tracking_enabled(kvm)))
162122
return;
163123

164-
update_gfn_track(slot, gfn, mode, -1);
124+
update_gfn_write_track(slot, gfn, -1);
165125

166126
/*
167127
* allow large page mapping for the tracked page
@@ -176,22 +136,18 @@ EXPORT_SYMBOL_GPL(kvm_slot_page_track_remove_page);
176136
*/
177137
bool kvm_slot_page_track_is_active(struct kvm *kvm,
178138
const struct kvm_memory_slot *slot,
179-
gfn_t gfn, enum kvm_page_track_mode mode)
139+
gfn_t gfn)
180140
{
181141
int index;
182142

183-
if (WARN_ON_ONCE(!page_track_mode_is_valid(mode)))
184-
return false;
185-
186143
if (!slot)
187144
return false;
188145

189-
if (mode == KVM_PAGE_TRACK_WRITE &&
190-
!kvm_page_track_write_tracking_enabled(kvm))
146+
if (!kvm_page_track_write_tracking_enabled(kvm))
191147
return false;
192148

193149
index = gfn_to_index(gfn, slot->base_gfn, PG_LEVEL_4K);
194-
return !!READ_ONCE(slot->arch.gfn_track[mode][index]);
150+
return !!READ_ONCE(slot->arch.gfn_write_track[index]);
195151
}
196152

197153
#ifdef CONFIG_KVM_EXTERNAL_WRITE_TRACKING

arch/x86/kvm/mmu/page_track.h

Lines changed: 1 addition & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -16,8 +16,7 @@ int kvm_page_track_create_memslot(struct kvm *kvm,
1616
unsigned long npages);
1717

1818
bool kvm_slot_page_track_is_active(struct kvm *kvm,
19-
const struct kvm_memory_slot *slot,
20-
gfn_t gfn, enum kvm_page_track_mode mode);
19+
const struct kvm_memory_slot *slot, gfn_t gfn);
2120

2221
#ifdef CONFIG_KVM_EXTERNAL_WRITE_TRACKING
2322
int kvm_page_track_init(struct kvm *kvm);

drivers/gpu/drm/i915/gvt/kvmgt.c

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1564,7 +1564,7 @@ int intel_gvt_page_track_add(struct intel_vgpu *info, u64 gfn)
15641564
}
15651565

15661566
write_lock(&kvm->mmu_lock);
1567-
kvm_slot_page_track_add_page(kvm, slot, gfn, KVM_PAGE_TRACK_WRITE);
1567+
kvm_slot_page_track_add_page(kvm, slot, gfn);
15681568
write_unlock(&kvm->mmu_lock);
15691569

15701570
srcu_read_unlock(&kvm->srcu, idx);
@@ -1593,7 +1593,7 @@ int intel_gvt_page_track_remove(struct intel_vgpu *info, u64 gfn)
15931593
}
15941594

15951595
write_lock(&kvm->mmu_lock);
1596-
kvm_slot_page_track_remove_page(kvm, slot, gfn, KVM_PAGE_TRACK_WRITE);
1596+
kvm_slot_page_track_remove_page(kvm, slot, gfn);
15971597
write_unlock(&kvm->mmu_lock);
15981598
srcu_read_unlock(&kvm->srcu, idx);
15991599

0 commit comments

Comments
 (0)