forked from Minki/linux
KVM: x86: Fix wall clock writes in Xen shared_info not to mark page dirty
When dirty ring logging is enabled, any dirty logging without an active
vCPU context will cause a kernel oops. But we've already declared that
the shared_info page doesn't get dirty tracking anyway, since it would
be kind of insane to mark it dirty every time we deliver an event channel
interrupt. Userspace is supposed to just assume it's always dirty any
time a vCPU can run or event channels are routed.
So stop using the generic kvm_write_wall_clock() and just write directly
through the gfn_to_pfn_cache that we already have set up.
We can make kvm_write_wall_clock() static in x86.c again now, but let's
not remove the 'sec_hi_ofs' argument even though it's not used yet. At
some point we *will* want to use that for KVM guests too.
Fixes: 629b534884
("KVM: x86/xen: update wallclock region")
Reported-by: butt3rflyh4ck <butterflyhuangxx@gmail.com>
Signed-off-by: David Woodhouse <dwmw@amazon.co.uk>
Message-Id: <20211210163625.2886-6-dwmw2@infradead.org>
Signed-off-by: Paolo Bonzini <pbonzini@redhat.com>
This commit is contained in:
parent
14243b3871
commit
55749769fe
@ -2135,7 +2135,7 @@ static s64 get_kvmclock_base_ns(void)
|
|||||||
}
|
}
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
void kvm_write_wall_clock(struct kvm *kvm, gpa_t wall_clock, int sec_hi_ofs)
|
static void kvm_write_wall_clock(struct kvm *kvm, gpa_t wall_clock, int sec_hi_ofs)
|
||||||
{
|
{
|
||||||
int version;
|
int version;
|
||||||
int r;
|
int r;
|
||||||
|
@ -301,7 +301,6 @@ static inline bool kvm_vcpu_latch_init(struct kvm_vcpu *vcpu)
|
|||||||
return is_smm(vcpu) || static_call(kvm_x86_apic_init_signal_blocked)(vcpu);
|
return is_smm(vcpu) || static_call(kvm_x86_apic_init_signal_blocked)(vcpu);
|
||||||
}
|
}
|
||||||
|
|
||||||
void kvm_write_wall_clock(struct kvm *kvm, gpa_t wall_clock, int sec_hi_ofs);
|
|
||||||
void kvm_inject_realmode_interrupt(struct kvm_vcpu *vcpu, int irq, int inc_eip);
|
void kvm_inject_realmode_interrupt(struct kvm_vcpu *vcpu, int irq, int inc_eip);
|
||||||
|
|
||||||
u64 get_kvmclock_ns(struct kvm *kvm);
|
u64 get_kvmclock_ns(struct kvm *kvm);
|
||||||
|
@ -25,8 +25,11 @@ DEFINE_STATIC_KEY_DEFERRED_FALSE(kvm_xen_enabled, HZ);
|
|||||||
static int kvm_xen_shared_info_init(struct kvm *kvm, gfn_t gfn)
|
static int kvm_xen_shared_info_init(struct kvm *kvm, gfn_t gfn)
|
||||||
{
|
{
|
||||||
struct gfn_to_pfn_cache *gpc = &kvm->arch.xen.shinfo_cache;
|
struct gfn_to_pfn_cache *gpc = &kvm->arch.xen.shinfo_cache;
|
||||||
|
struct pvclock_wall_clock *wc;
|
||||||
gpa_t gpa = gfn_to_gpa(gfn);
|
gpa_t gpa = gfn_to_gpa(gfn);
|
||||||
int wc_ofs, sec_hi_ofs;
|
u32 *wc_sec_hi;
|
||||||
|
u32 wc_version;
|
||||||
|
u64 wall_nsec;
|
||||||
int ret = 0;
|
int ret = 0;
|
||||||
int idx = srcu_read_lock(&kvm->srcu);
|
int idx = srcu_read_lock(&kvm->srcu);
|
||||||
|
|
||||||
@ -35,32 +38,63 @@ static int kvm_xen_shared_info_init(struct kvm *kvm, gfn_t gfn)
|
|||||||
goto out;
|
goto out;
|
||||||
}
|
}
|
||||||
|
|
||||||
ret = kvm_gfn_to_pfn_cache_init(kvm, gpc, NULL, false, true, gpa,
|
do {
|
||||||
PAGE_SIZE, false);
|
ret = kvm_gfn_to_pfn_cache_init(kvm, gpc, NULL, false, true,
|
||||||
if (ret)
|
gpa, PAGE_SIZE, false);
|
||||||
goto out;
|
if (ret)
|
||||||
|
goto out;
|
||||||
|
|
||||||
|
/*
|
||||||
|
* This code mirrors kvm_write_wall_clock() except that it writes
|
||||||
|
* directly through the pfn cache and doesn't mark the page dirty.
|
||||||
|
*/
|
||||||
|
wall_nsec = ktime_get_real_ns() - get_kvmclock_ns(kvm);
|
||||||
|
|
||||||
|
/* It could be invalid again already, so we need to check */
|
||||||
|
read_lock_irq(&gpc->lock);
|
||||||
|
|
||||||
|
if (gpc->valid)
|
||||||
|
break;
|
||||||
|
|
||||||
|
read_unlock_irq(&gpc->lock);
|
||||||
|
} while (1);
|
||||||
|
|
||||||
/* Paranoia checks on the 32-bit struct layout */
|
/* Paranoia checks on the 32-bit struct layout */
|
||||||
BUILD_BUG_ON(offsetof(struct compat_shared_info, wc) != 0x900);
|
BUILD_BUG_ON(offsetof(struct compat_shared_info, wc) != 0x900);
|
||||||
BUILD_BUG_ON(offsetof(struct compat_shared_info, arch.wc_sec_hi) != 0x924);
|
BUILD_BUG_ON(offsetof(struct compat_shared_info, arch.wc_sec_hi) != 0x924);
|
||||||
BUILD_BUG_ON(offsetof(struct pvclock_vcpu_time_info, version) != 0);
|
BUILD_BUG_ON(offsetof(struct pvclock_vcpu_time_info, version) != 0);
|
||||||
|
|
||||||
/* 32-bit location by default */
|
|
||||||
wc_ofs = offsetof(struct compat_shared_info, wc);
|
|
||||||
sec_hi_ofs = offsetof(struct compat_shared_info, arch.wc_sec_hi);
|
|
||||||
|
|
||||||
#ifdef CONFIG_X86_64
|
#ifdef CONFIG_X86_64
|
||||||
/* Paranoia checks on the 64-bit struct layout */
|
/* Paranoia checks on the 64-bit struct layout */
|
||||||
BUILD_BUG_ON(offsetof(struct shared_info, wc) != 0xc00);
|
BUILD_BUG_ON(offsetof(struct shared_info, wc) != 0xc00);
|
||||||
BUILD_BUG_ON(offsetof(struct shared_info, wc_sec_hi) != 0xc0c);
|
BUILD_BUG_ON(offsetof(struct shared_info, wc_sec_hi) != 0xc0c);
|
||||||
|
|
||||||
if (kvm->arch.xen.long_mode) {
|
if (IS_ENABLED(CONFIG_64BIT) && kvm->arch.xen.long_mode) {
|
||||||
wc_ofs = offsetof(struct shared_info, wc);
|
struct shared_info *shinfo = gpc->khva;
|
||||||
sec_hi_ofs = offsetof(struct shared_info, wc_sec_hi);
|
|
||||||
}
|
wc_sec_hi = &shinfo->wc_sec_hi;
|
||||||
#endif
|
wc = &shinfo->wc;
|
||||||
|
} else
|
||||||
|
#endif
|
||||||
|
{
|
||||||
|
struct compat_shared_info *shinfo = gpc->khva;
|
||||||
|
|
||||||
|
wc_sec_hi = &shinfo->arch.wc_sec_hi;
|
||||||
|
wc = &shinfo->wc;
|
||||||
|
}
|
||||||
|
|
||||||
|
/* Increment and ensure an odd value */
|
||||||
|
wc_version = wc->version = (wc->version + 1) | 1;
|
||||||
|
smp_wmb();
|
||||||
|
|
||||||
|
wc->nsec = do_div(wall_nsec, 1000000000);
|
||||||
|
wc->sec = (u32)wall_nsec;
|
||||||
|
*wc_sec_hi = wall_nsec >> 32;
|
||||||
|
smp_wmb();
|
||||||
|
|
||||||
|
wc->version = wc_version + 1;
|
||||||
|
read_unlock_irq(&gpc->lock);
|
||||||
|
|
||||||
kvm_write_wall_clock(kvm, gpa + wc_ofs, sec_hi_ofs - wc_ofs);
|
|
||||||
kvm_make_all_cpus_request(kvm, KVM_REQ_MASTERCLOCK_UPDATE);
|
kvm_make_all_cpus_request(kvm, KVM_REQ_MASTERCLOCK_UPDATE);
|
||||||
|
|
||||||
out:
|
out:
|
||||||
|
Loading…
Reference in New Issue
Block a user