Skip to content

Commit 81576a9

Browse files
committed
Merge tag 'for-linus' of git://git.kernel.org/pub/scm/virt/kvm/kvm
Pull kvm fixes from Paolo Bonzini: "ARM64: - Fix confusion with implicitly-shifted MDCR_EL2 masks breaking SPE/TRBE initialization - Align nested page table walker with the intended memory attribute combining rules of the architecture - Prevent userspace from constraining the advertised ASID width, avoiding horrors of guest TLBIs not matching the intended context in hardware - Don't leak references on LPIs when insertion into the translation cache fails RISC-V: - Replace csr_write() with csr_set() for HVIEN PMU overflow bit x86: - Cache CPUID.0xD XSTATE offsets+sizes during module init On Intel's Emerald Rapids CPUID costs hundreds of cycles and there are a lot of leaves under 0xD. Getting rid of the CPUIDs during nested VM-Enter and VM-Exit is planned for the next release, for now just cache them: even on Skylake that is 40% faster" * tag 'for-linus' of git://git.kernel.org/pub/scm/virt/kvm/kvm: KVM: x86: Cache CPUID.0xD XSTATE offsets+sizes during module init RISC-V: KVM: Fix csr_write -> csr_set for HVIEN PMU overflow bit KVM: arm64: vgic-its: Add error handling in vgic_its_cache_translation KVM: arm64: Do not allow ID_AA64MMFR0_EL1.ASIDbits to be overridden KVM: arm64: Fix S1/S2 combination when FWB==1 and S2 has Device memory type arm64: Fix usage of new shifted MDCR_EL2 values
2 parents 2d8308b + 3522c41 commit 81576a9

File tree

10 files changed

+58
-16
lines changed

10 files changed

+58
-16
lines changed

arch/arm64/include/asm/el2_setup.h

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -87,7 +87,7 @@
8787
1 << PMSCR_EL2_PA_SHIFT)
8888
msr_s SYS_PMSCR_EL2, x0 // addresses and physical counter
8989
.Lskip_spe_el2_\@:
90-
mov x0, #(MDCR_EL2_E2PB_MASK << MDCR_EL2_E2PB_SHIFT)
90+
mov x0, #MDCR_EL2_E2PB_MASK
9191
orr x2, x2, x0 // If we don't have VHE, then
9292
// use EL1&0 translation.
9393

@@ -100,7 +100,7 @@
100100
and x0, x0, TRBIDR_EL1_P
101101
cbnz x0, .Lskip_trace_\@ // If TRBE is available at EL2
102102

103-
mov x0, #(MDCR_EL2_E2TB_MASK << MDCR_EL2_E2TB_SHIFT)
103+
mov x0, #MDCR_EL2_E2TB_MASK
104104
orr x2, x2, x0 // allow the EL1&0 translation
105105
// to own it.
106106

arch/arm64/kernel/hyp-stub.S

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -114,8 +114,8 @@ SYM_CODE_START_LOCAL(__finalise_el2)
114114

115115
// Use EL2 translations for SPE & TRBE and disable access from EL1
116116
mrs x0, mdcr_el2
117-
bic x0, x0, #(MDCR_EL2_E2PB_MASK << MDCR_EL2_E2PB_SHIFT)
118-
bic x0, x0, #(MDCR_EL2_E2TB_MASK << MDCR_EL2_E2TB_SHIFT)
117+
bic x0, x0, #MDCR_EL2_E2PB_MASK
118+
bic x0, x0, #MDCR_EL2_E2TB_MASK
119119
msr mdcr_el2, x0
120120

121121
// Transfer the MM state from EL1 to EL2

arch/arm64/kvm/at.c

Lines changed: 9 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -739,8 +739,15 @@ static u64 compute_par_s12(struct kvm_vcpu *vcpu, u64 s1_par,
739739
final_attr = s1_parattr;
740740
break;
741741
default:
742-
/* MemAttr[2]=0, Device from S2 */
743-
final_attr = s2_memattr & GENMASK(1,0) << 2;
742+
/*
743+
* MemAttr[2]=0, Device from S2.
744+
*
745+
* FWB does not influence the way that stage 1
746+
* memory types and attributes are combined
747+
* with stage 2 Device type and attributes.
748+
*/
749+
final_attr = min(s2_memattr_to_attr(s2_memattr),
750+
s1_parattr);
744751
}
745752
} else {
746753
/* Combination of R_HMNDG, R_TNHFM and R_GQFSF */

arch/arm64/kvm/hyp/nvhe/pkvm.c

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -126,7 +126,7 @@ static void pvm_init_traps_aa64dfr0(struct kvm_vcpu *vcpu)
126126
/* Trap SPE */
127127
if (!FIELD_GET(ARM64_FEATURE_MASK(ID_AA64DFR0_EL1_PMSVer), feature_ids)) {
128128
mdcr_set |= MDCR_EL2_TPMS;
129-
mdcr_clear |= MDCR_EL2_E2PB_MASK << MDCR_EL2_E2PB_SHIFT;
129+
mdcr_clear |= MDCR_EL2_E2PB_MASK;
130130
}
131131

132132
/* Trap Trace Filter */
@@ -143,7 +143,7 @@ static void pvm_init_traps_aa64dfr0(struct kvm_vcpu *vcpu)
143143

144144
/* Trap External Trace */
145145
if (!FIELD_GET(ARM64_FEATURE_MASK(ID_AA64DFR0_EL1_ExtTrcBuff), feature_ids))
146-
mdcr_clear |= MDCR_EL2_E2TB_MASK << MDCR_EL2_E2TB_SHIFT;
146+
mdcr_clear |= MDCR_EL2_E2TB_MASK;
147147

148148
vcpu->arch.mdcr_el2 |= mdcr_set;
149149
vcpu->arch.mdcr_el2 &= ~mdcr_clear;

arch/arm64/kvm/sys_regs.c

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -2618,7 +2618,8 @@ static const struct sys_reg_desc sys_reg_descs[] = {
26182618
ID_WRITABLE(ID_AA64MMFR0_EL1, ~(ID_AA64MMFR0_EL1_RES0 |
26192619
ID_AA64MMFR0_EL1_TGRAN4_2 |
26202620
ID_AA64MMFR0_EL1_TGRAN64_2 |
2621-
ID_AA64MMFR0_EL1_TGRAN16_2)),
2621+
ID_AA64MMFR0_EL1_TGRAN16_2 |
2622+
ID_AA64MMFR0_EL1_ASIDBITS)),
26222623
ID_WRITABLE(ID_AA64MMFR1_EL1, ~(ID_AA64MMFR1_EL1_RES0 |
26232624
ID_AA64MMFR1_EL1_HCX |
26242625
ID_AA64MMFR1_EL1_TWED |

arch/arm64/kvm/vgic/vgic-its.c

Lines changed: 11 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -608,12 +608,22 @@ static void vgic_its_cache_translation(struct kvm *kvm, struct vgic_its *its,
608608
lockdep_assert_held(&its->its_lock);
609609
vgic_get_irq_kref(irq);
610610

611+
old = xa_store(&its->translation_cache, cache_key, irq, GFP_KERNEL_ACCOUNT);
612+
613+
/*
614+
* Put the reference taken on @irq if the store fails. Intentionally do
615+
* not return the error as the translation cache is best effort.
616+
*/
617+
if (xa_is_err(old)) {
618+
vgic_put_irq(kvm, irq);
619+
return;
620+
}
621+
611622
/*
612623
* We could have raced with another CPU caching the same
613624
* translation behind our back, ensure we don't leak a
614625
* reference if that is the case.
615626
*/
616-
old = xa_store(&its->translation_cache, cache_key, irq, GFP_KERNEL_ACCOUNT);
617627
if (old)
618628
vgic_put_irq(kvm, old);
619629
}

arch/riscv/kvm/aia.c

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -590,7 +590,7 @@ void kvm_riscv_aia_enable(void)
590590
csr_set(CSR_HIE, BIT(IRQ_S_GEXT));
591591
/* Enable IRQ filtering for overflow interrupt only if sscofpmf is present */
592592
if (__riscv_isa_extension_available(NULL, RISCV_ISA_EXT_SSCOFPMF))
593-
csr_write(CSR_HVIEN, BIT(IRQ_PMU_OVF));
593+
csr_set(CSR_HVIEN, BIT(IRQ_PMU_OVF));
594594
}
595595

596596
void kvm_riscv_aia_disable(void)

arch/x86/kvm/cpuid.c

Lines changed: 26 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -36,6 +36,26 @@
3636
u32 kvm_cpu_caps[NR_KVM_CPU_CAPS] __read_mostly;
3737
EXPORT_SYMBOL_GPL(kvm_cpu_caps);
3838

39+
struct cpuid_xstate_sizes {
40+
u32 eax;
41+
u32 ebx;
42+
u32 ecx;
43+
};
44+
45+
static struct cpuid_xstate_sizes xstate_sizes[XFEATURE_MAX] __ro_after_init;
46+
47+
void __init kvm_init_xstate_sizes(void)
48+
{
49+
u32 ign;
50+
int i;
51+
52+
for (i = XFEATURE_YMM; i < ARRAY_SIZE(xstate_sizes); i++) {
53+
struct cpuid_xstate_sizes *xs = &xstate_sizes[i];
54+
55+
cpuid_count(0xD, i, &xs->eax, &xs->ebx, &xs->ecx, &ign);
56+
}
57+
}
58+
3959
u32 xstate_required_size(u64 xstate_bv, bool compacted)
4060
{
4161
int feature_bit = 0;
@@ -44,14 +64,15 @@ u32 xstate_required_size(u64 xstate_bv, bool compacted)
4464
xstate_bv &= XFEATURE_MASK_EXTEND;
4565
while (xstate_bv) {
4666
if (xstate_bv & 0x1) {
47-
u32 eax, ebx, ecx, edx, offset;
48-
cpuid_count(0xD, feature_bit, &eax, &ebx, &ecx, &edx);
67+
struct cpuid_xstate_sizes *xs = &xstate_sizes[feature_bit];
68+
u32 offset;
69+
4970
/* ECX[1]: 64B alignment in compacted form */
5071
if (compacted)
51-
offset = (ecx & 0x2) ? ALIGN(ret, 64) : ret;
72+
offset = (xs->ecx & 0x2) ? ALIGN(ret, 64) : ret;
5273
else
53-
offset = ebx;
54-
ret = max(ret, offset + eax);
74+
offset = xs->ebx;
75+
ret = max(ret, offset + xs->eax);
5576
}
5677

5778
xstate_bv >>= 1;

arch/x86/kvm/cpuid.h

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -31,6 +31,7 @@ int kvm_vcpu_ioctl_get_cpuid2(struct kvm_vcpu *vcpu,
3131
bool kvm_cpuid(struct kvm_vcpu *vcpu, u32 *eax, u32 *ebx,
3232
u32 *ecx, u32 *edx, bool exact_only);
3333

34+
void __init kvm_init_xstate_sizes(void);
3435
u32 xstate_required_size(u64 xstate_bv, bool compacted);
3536

3637
int cpuid_query_maxphyaddr(struct kvm_vcpu *vcpu);

arch/x86/kvm/x86.c

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -13997,6 +13997,8 @@ EXPORT_TRACEPOINT_SYMBOL_GPL(kvm_rmp_fault);
1399713997

1399813998
static int __init kvm_x86_init(void)
1399913999
{
14000+
kvm_init_xstate_sizes();
14001+
1400014002
kvm_mmu_x86_module_init();
1400114003
mitigate_smt_rsb &= boot_cpu_has_bug(X86_BUG_SMT_RSB) && cpu_smt_possible();
1400214004
return 0;

0 commit comments

Comments
 (0)