diff mbox

[v3] KVM: LAPIC: Fix lapic timer injection delay

Message ID 68c0d7f8-683f-c7fa-b328-e90e8dd9a789@redhat.com (mailing list archive)
State New, archived
Headers show

Commit Message

Paolo Bonzini June 28, 2017, 12:10 p.m. UTC
On 28/06/2017 03:29, Wanpeng Li wrote:
>  	u64 tscdeadline = apic->lapic_timer.tscdeadline;
> +	int ret = 0;
>  
>  	if ((atomic_read(&apic->lapic_timer.pending) &&
>  		!apic_lvtt_period(apic)) ||
> -		kvm_x86_ops->set_hv_timer(apic->vcpu, tscdeadline)) {
> +		(ret = kvm_x86_ops->set_hv_timer(apic->vcpu, tscdeadline))) {
>  		if (apic->lapic_timer.hv_timer_in_use)
>  			cancel_hv_timer(apic);
> +		if (ret == 1) {
> +			apic_timer_expired(apic);
> +			return true;
> +		}

The preemption timer can also be used for modes other than TSC deadline.

In periodic mode, your patch would miss a call to
advance_periodic_target_expiration, which is only called by
kvm_lapic_expired_hv_timer.

You could use something like this (the diff is shown in the "Patch" section at the end of this message):


but I'm afraid of introducing a mutual recursion between
start_hv_timer and kvm_lapic_expired_hv_timer.

Paolo

Comments

Wanpeng Li June 28, 2017, 1:55 p.m. UTC | #1
2017-06-28 20:10 GMT+08:00 Paolo Bonzini <pbonzini@redhat.com>:
>
>
> On 28/06/2017 03:29, Wanpeng Li wrote:
>>       u64 tscdeadline = apic->lapic_timer.tscdeadline;
>> +     int ret = 0;
>>
>>       if ((atomic_read(&apic->lapic_timer.pending) &&
>>               !apic_lvtt_period(apic)) ||
>> -             kvm_x86_ops->set_hv_timer(apic->vcpu, tscdeadline)) {
>> +             (ret = kvm_x86_ops->set_hv_timer(apic->vcpu, tscdeadline))) {
>>               if (apic->lapic_timer.hv_timer_in_use)
>>                       cancel_hv_timer(apic);
>> +             if (ret == 1) {
>> +                     apic_timer_expired(apic);
>> +                     return true;
>> +             }
>
> The preemption timer can also be used for modes other than TSC deadline.
>
> In periodic mode, your patch would miss a call to
> advance_periodic_target_expiration, which is only called by
> kvm_lapic_expired_hv_timer.

Actually, I considered this before. However, I was following the APIC timer
periodic mode that is emulated by hrtimer: there is no hrtimer start
for the next period in start_sw_period(). Is that also buggy?

Regards,
Wanpeng Li

>
> You could use something like this:
>
> diff --git a/arch/x86/kvm/lapic.c b/arch/x86/kvm/lapic.c
> index d24c8742d9b0..15b751aa7625 100644
> --- a/arch/x86/kvm/lapic.c
> +++ b/arch/x86/kvm/lapic.c
> @@ -1504,21 +1504,26 @@ static void cancel_hv_timer(struct kvm_lapic *apic)
>  static bool start_hv_timer(struct kvm_lapic *apic)
>  {
>         u64 tscdeadline = apic->lapic_timer.tscdeadline;
> +       bool need_cancel = apic->lapic_timer.hv_timer_in_use;
> +       if (!atomic_read(&apic->lapic_timer.pending) || apic_lvtt_period(apic)) {
> +               int r = kvm_x86_ops->set_hv_timer(apic->vcpu, tscdeadline);
> +               if (r >= 0) {
> +                       need_cancel = false;
> +                       apic->lapic_timer.hv_timer_in_use = true;
> +                       hrtimer_cancel(&apic->lapic_timer.timer);
>
> -       if ((atomic_read(&apic->lapic_timer.pending) &&
> -               !apic_lvtt_period(apic)) ||
> -               kvm_x86_ops->set_hv_timer(apic->vcpu, tscdeadline)) {
> -               if (apic->lapic_timer.hv_timer_in_use)
> -                       cancel_hv_timer(apic);
> -       } else {
> -               apic->lapic_timer.hv_timer_in_use = true;
> -               hrtimer_cancel(&apic->lapic_timer.timer);
> -
> -               /* In case the sw timer triggered in the window */
> -               if (atomic_read(&apic->lapic_timer.pending) &&
> -                       !apic_lvtt_period(apic))
> -                       cancel_hv_timer(apic);
> +                       /* In case the sw timer triggered in the window */
> +                       if (atomic_read(&apic->lapic_timer.pending) &&
> +                           !apic_lvtt_period(apic))
> +                               need_cancel = true;
> +                       else if (r)
> +                               kvm_lapic_expired_hv_timer(vcpu);
> +               }
>         }
> +
> +       if (need_cancel)
> +               cancel_hv_timer(apic);
> +
>         trace_kvm_hv_timer_state(apic->vcpu->vcpu_id,
>                         apic->lapic_timer.hv_timer_in_use);
>         return apic->lapic_timer.hv_timer_in_use;
>
> but I'm afraid of introducing a mutual recursion between
> start_hv_timer and kvm_lapic_expired_hv_timer.
>
> Paolo
Paolo Bonzini June 28, 2017, 2 p.m. UTC | #2
On 28/06/2017 15:55, Wanpeng Li wrote:
>>>       if ((atomic_read(&apic->lapic_timer.pending) &&
>>>               !apic_lvtt_period(apic)) ||
>>> -             kvm_x86_ops->set_hv_timer(apic->vcpu, tscdeadline)) {
>>> +             (ret = kvm_x86_ops->set_hv_timer(apic->vcpu, tscdeadline))) {
>>>               if (apic->lapic_timer.hv_timer_in_use)
>>>                       cancel_hv_timer(apic);
>>> +             if (ret == 1) {
>>> +                     apic_timer_expired(apic);
>>> +                     return true;
>>> +             }
>> The preemption timer can also be used for modes other than TSC deadline.
>>
>> In periodic mode, your patch would miss a call to
>> advance_periodic_target_expiration, which is only called by
>> kvm_lapic_expired_hv_timer.
> Actually I considered this before, however, I referred to apic timer
> periodic mode which is emulated by hrtimer

Periodic mode can also be emulated by preemption timer... it was added
by some Wanpeng Li in commit 8003c9ae204e ("KVM: LAPIC: add APIC Timer
periodic/oneshot mode VMX preemption timer support", 2016-11-02), do you
know him? ;)

> , there is no hrtimer start
> for the next period in start_sw_period(). If it is also buggy?

start_sw_period always goes through the hrtimer for periodic timer:

        if (apic_lvtt_oneshot(apic) &&
            ktime_after(ktime_get(),
                        apic->lapic_timer.target_expiration)) {
                apic_timer_expired(apic);
                return;
        }

        hrtimer_start(&apic->lapic_timer.timer,
                apic->lapic_timer.target_expiration,
                HRTIMER_MODE_ABS_PINNED);

(the direct call to apic_timer_expired is conditional on
apic_lvtt_oneshot).  This way, apic_timer_fn takes care of advancing the
hrtimer deadline and returning HRTIMER_RESTART.

Paolo
Wanpeng Li June 28, 2017, 2:05 p.m. UTC | #3
2017-06-28 22:00 GMT+08:00 Paolo Bonzini <pbonzini@redhat.com>:
>
>
> On 28/06/2017 15:55, Wanpeng Li wrote:
>>>>       if ((atomic_read(&apic->lapic_timer.pending) &&
>>>>               !apic_lvtt_period(apic)) ||
>>>> -             kvm_x86_ops->set_hv_timer(apic->vcpu, tscdeadline)) {
>>>> +             (ret = kvm_x86_ops->set_hv_timer(apic->vcpu, tscdeadline))) {
>>>>               if (apic->lapic_timer.hv_timer_in_use)
>>>>                       cancel_hv_timer(apic);
>>>> +             if (ret == 1) {
>>>> +                     apic_timer_expired(apic);
>>>> +                     return true;
>>>> +             }
>>> The preemption timer can also be used for modes other than TSC deadline.
>>>
>>> In periodic mode, your patch would miss a call to
>>> advance_periodic_target_expiration, which is only called by
>>> kvm_lapic_expired_hv_timer.
>> Actually I considered this before, however, I referred to apic timer
>> periodic mode which is emulated by hrtimer
>
> Periodic mode can also be emulated by preemption timer... it was added
> by some Wanpeng Li in commit 8003c9ae204e ("KVM: LAPIC: add APIC Timer
> periodic/oneshot mode VMX preemption timer support", 2016-11-02), do you
> know him? ;)

Indeed. :)

>
>> , there is no hrtimer start
>> for the next period in start_sw_period(). If it is also buggy?
>
> start_sw_period always goes through the hrtimer for periodic timer:
>
>         if (apic_lvtt_oneshot(apic) &&
>             ktime_after(ktime_get(),
>                         apic->lapic_timer.target_expiration)) {
>                 apic_timer_expired(apic);
>                 return;
>         }
>
>         hrtimer_start(&apic->lapic_timer.timer,
>                 apic->lapic_timer.target_expiration,
>                 HRTIMER_MODE_ABS_PINNED);
>
> (the direct call to apic_timer_expired is conditonal to
> apic_lvtt_oneshot).  This way, apic_timer_fn takes care of advancing the
> hrtimer deadline and returning HRTIMER_RESTART.

Ah, yes, I missed the apic_lvtt_oneshot() check here.

Regards,
Wanpeng Li
Wanpeng Li June 28, 2017, 2:27 p.m. UTC | #4
2017-06-28 20:10 GMT+08:00 Paolo Bonzini <pbonzini@redhat.com>:
>
>
> On 28/06/2017 03:29, Wanpeng Li wrote:
>>       u64 tscdeadline = apic->lapic_timer.tscdeadline;
>> +     int ret = 0;
>>
>>       if ((atomic_read(&apic->lapic_timer.pending) &&
>>               !apic_lvtt_period(apic)) ||
>> -             kvm_x86_ops->set_hv_timer(apic->vcpu, tscdeadline)) {
>> +             (ret = kvm_x86_ops->set_hv_timer(apic->vcpu, tscdeadline))) {
>>               if (apic->lapic_timer.hv_timer_in_use)
>>                       cancel_hv_timer(apic);
>> +             if (ret == 1) {
>> +                     apic_timer_expired(apic);
>> +                     return true;
>> +             }
>
> The preemption timer can also be used for modes other than TSC deadline.
>
> In periodic mode, your patch would miss a call to
> advance_periodic_target_expiration, which is only called by
> kvm_lapic_expired_hv_timer.
>
> You could use something like this:
>
> diff --git a/arch/x86/kvm/lapic.c b/arch/x86/kvm/lapic.c
> index d24c8742d9b0..15b751aa7625 100644
> --- a/arch/x86/kvm/lapic.c
> +++ b/arch/x86/kvm/lapic.c
> @@ -1504,21 +1504,26 @@ static void cancel_hv_timer(struct kvm_lapic *apic)
>  static bool start_hv_timer(struct kvm_lapic *apic)
>  {
>         u64 tscdeadline = apic->lapic_timer.tscdeadline;
> +       bool need_cancel = apic->lapic_timer.hv_timer_in_use;
> +       if (!atomic_read(&apic->lapic_timer.pending) || apic_lvtt_period(apic)) {
> +               int r = kvm_x86_ops->set_hv_timer(apic->vcpu, tscdeadline);
> +               if (r >= 0) {
> +                       need_cancel = false;
> +                       apic->lapic_timer.hv_timer_in_use = true;
> +                       hrtimer_cancel(&apic->lapic_timer.timer);
>
> -       if ((atomic_read(&apic->lapic_timer.pending) &&
> -               !apic_lvtt_period(apic)) ||
> -               kvm_x86_ops->set_hv_timer(apic->vcpu, tscdeadline)) {
> -               if (apic->lapic_timer.hv_timer_in_use)
> -                       cancel_hv_timer(apic);
> -       } else {
> -               apic->lapic_timer.hv_timer_in_use = true;
> -               hrtimer_cancel(&apic->lapic_timer.timer);
> -
> -               /* In case the sw timer triggered in the window */
> -               if (atomic_read(&apic->lapic_timer.pending) &&
> -                       !apic_lvtt_period(apic))
> -                       cancel_hv_timer(apic);
> +                       /* In case the sw timer triggered in the window */
> +                       if (atomic_read(&apic->lapic_timer.pending) &&
> +                           !apic_lvtt_period(apic))
> +                               need_cancel = true;
> +                       else if (r)
> +                               kvm_lapic_expired_hv_timer(vcpu);
> +               }
>         }
> +
> +       if (need_cancel)
> +               cancel_hv_timer(apic);
> +
>         trace_kvm_hv_timer_state(apic->vcpu->vcpu_id,
>                         apic->lapic_timer.hv_timer_in_use);
>         return apic->lapic_timer.hv_timer_in_use;
>
> but I'm afraid of introducing a mutual recursion between
> start_hv_timer and kvm_lapic_expired_hv_timer.

We can handle only the APIC timer oneshot/tscdeadline modes here and leave
periodic mode alone, just as the hrtimer-emulated path does, to avoid the
mutual recursion. What do you think?

Regards,
Wanpeng Li
Paolo Bonzini June 28, 2017, 2:30 p.m. UTC | #5
On 28/06/2017 16:27, Wanpeng Li wrote:
> 2017-06-28 20:10 GMT+08:00 Paolo Bonzini <pbonzini@redhat.com>:
>>
>>
>> On 28/06/2017 03:29, Wanpeng Li wrote:
>>>       u64 tscdeadline = apic->lapic_timer.tscdeadline;
>>> +     int ret = 0;
>>>
>>>       if ((atomic_read(&apic->lapic_timer.pending) &&
>>>               !apic_lvtt_period(apic)) ||
>>> -             kvm_x86_ops->set_hv_timer(apic->vcpu, tscdeadline)) {
>>> +             (ret = kvm_x86_ops->set_hv_timer(apic->vcpu, tscdeadline))) {
>>>               if (apic->lapic_timer.hv_timer_in_use)
>>>                       cancel_hv_timer(apic);
>>> +             if (ret == 1) {
>>> +                     apic_timer_expired(apic);
>>> +                     return true;
>>> +             }
>>
>> The preemption timer can also be used for modes other than TSC deadline.
>>
>> In periodic mode, your patch would miss a call to
>> advance_periodic_target_expiration, which is only called by
>> kvm_lapic_expired_hv_timer.
>>
>> You could use something like this:
>>
>> diff --git a/arch/x86/kvm/lapic.c b/arch/x86/kvm/lapic.c
>> index d24c8742d9b0..15b751aa7625 100644
>> --- a/arch/x86/kvm/lapic.c
>> +++ b/arch/x86/kvm/lapic.c
>> @@ -1504,21 +1504,26 @@ static void cancel_hv_timer(struct kvm_lapic *apic)
>>  static bool start_hv_timer(struct kvm_lapic *apic)
>>  {
>>         u64 tscdeadline = apic->lapic_timer.tscdeadline;
>> +       bool need_cancel = apic->lapic_timer.hv_timer_in_use;
>> +       if (!atomic_read(&apic->lapic_timer.pending) || apic_lvtt_period(apic)) {
>> +               int r = kvm_x86_ops->set_hv_timer(apic->vcpu, tscdeadline);
>> +               if (r >= 0) {
>> +                       need_cancel = false;
>> +                       apic->lapic_timer.hv_timer_in_use = true;
>> +                       hrtimer_cancel(&apic->lapic_timer.timer);
>>
>> -       if ((atomic_read(&apic->lapic_timer.pending) &&
>> -               !apic_lvtt_period(apic)) ||
>> -               kvm_x86_ops->set_hv_timer(apic->vcpu, tscdeadline)) {
>> -               if (apic->lapic_timer.hv_timer_in_use)
>> -                       cancel_hv_timer(apic);
>> -       } else {
>> -               apic->lapic_timer.hv_timer_in_use = true;
>> -               hrtimer_cancel(&apic->lapic_timer.timer);
>> -
>> -               /* In case the sw timer triggered in the window */
>> -               if (atomic_read(&apic->lapic_timer.pending) &&
>> -                       !apic_lvtt_period(apic))
>> -                       cancel_hv_timer(apic);
>> +                       /* In case the sw timer triggered in the window */
>> +                       if (atomic_read(&apic->lapic_timer.pending) &&
>> +                           !apic_lvtt_period(apic))
>> +                               need_cancel = true;
>> +                       else if (r)
>> +                               kvm_lapic_expired_hv_timer(vcpu);
>> +               }
>>         }
>> +
>> +       if (need_cancel)
>> +               cancel_hv_timer(apic);
>> +
>>         trace_kvm_hv_timer_state(apic->vcpu->vcpu_id,
>>                         apic->lapic_timer.hv_timer_in_use);
>>         return apic->lapic_timer.hv_timer_in_use;
>>
>> but I'm afraid of introducing a mutual recursion between
>> start_hv_timer and kvm_lapic_expired_hv_timer.
> 
> We can just handle the apic timer oneshot/tscdeadline mode instead of
> periodic mode just like which is emulated by hrtimer to avoid the
> mutual recusion, what do you think?

In that case, set_hv_timer should probably always enable the preemption
timer.  You can then cancel it if it returns 1 _and_ the APIC timer's
mode is oneshot/tscdeadline.

Paolo
diff mbox

Patch

diff --git a/arch/x86/kvm/lapic.c b/arch/x86/kvm/lapic.c
index d24c8742d9b0..15b751aa7625 100644
--- a/arch/x86/kvm/lapic.c
+++ b/arch/x86/kvm/lapic.c
@@ -1504,21 +1504,26 @@  static void cancel_hv_timer(struct kvm_lapic *apic)
 static bool start_hv_timer(struct kvm_lapic *apic)
 {
 	u64 tscdeadline = apic->lapic_timer.tscdeadline;
+	bool need_cancel = apic->lapic_timer.hv_timer_in_use;
+	if (!atomic_read(&apic->lapic_timer.pending) || apic_lvtt_period(apic)) {
+		int r = kvm_x86_ops->set_hv_timer(apic->vcpu, tscdeadline);
+		if (r >= 0) {
+			need_cancel = false;
+			apic->lapic_timer.hv_timer_in_use = true;
+			hrtimer_cancel(&apic->lapic_timer.timer);
 
-	if ((atomic_read(&apic->lapic_timer.pending) &&
-		!apic_lvtt_period(apic)) ||
-		kvm_x86_ops->set_hv_timer(apic->vcpu, tscdeadline)) {
-		if (apic->lapic_timer.hv_timer_in_use)
-			cancel_hv_timer(apic);
-	} else {
-		apic->lapic_timer.hv_timer_in_use = true;
-		hrtimer_cancel(&apic->lapic_timer.timer);
-
-		/* In case the sw timer triggered in the window */
-		if (atomic_read(&apic->lapic_timer.pending) &&
-			!apic_lvtt_period(apic))
-			cancel_hv_timer(apic);
+			/* In case the sw timer triggered in the window */
+			if (atomic_read(&apic->lapic_timer.pending) &&
+			    !apic_lvtt_period(apic))
+				need_cancel = true;
+			else if (r)
+				kvm_lapic_expired_hv_timer(vcpu);
+		}
 	}
+
+	if (need_cancel)
+		cancel_hv_timer(apic);
+
 	trace_kvm_hv_timer_state(apic->vcpu->vcpu_id,
 			apic->lapic_timer.hv_timer_in_use);
 	return apic->lapic_timer.hv_timer_in_use;