diff mbox

[v8,2/7] cpu: allocate cpu->trace_dstate in place

Message ID 1496975122-16999-3-git-send-email-cota@braap.org (mailing list archive)
State New, archived
Headers show

Commit Message

Emilio Cota June 9, 2017, 2:25 a.m. UTC
There's little point in dynamically allocating the bitmap if we
know at compile-time the max number of events we want to support.
Thus, make room in the struct for the bitmap, which will make things
easier later: this paves the way for upcoming changes, in which
we'll use a u32 to fully capture cpu->trace_dstate.

This change also increases performance by saving a dereference and
improving locality--note that this is important since upcoming work
makes reading this bitmap fairly common.

Signed-off-by: Emilio G. Cota <cota@braap.org>
---
 include/qom/cpu.h | 9 +++------
 qom/cpu.c         | 8 --------
 trace/control.c   | 9 ++++++++-
 3 files changed, 11 insertions(+), 15 deletions(-)

Comments

Lluís Vilanova June 11, 2017, 12:36 p.m. UTC | #1
Emilio G Cota writes:

> There's little point in dynamically allocating the bitmap if we
> know at compile-time the max number of events we want to support.
> Thus, make room in the struct for the bitmap, which will make things
> easier later: this paves the way for upcoming changes, in which
> we'll use a u32 to fully capture cpu->trace_dstate.

> This change also increases performance by saving a dereference and
> improving locality--note that this is important since upcoming work
> makes reading this bitmap fairly common.

> Signed-off-by: Emilio G. Cota <cota@braap.org>

Reviewed-by: Lluís Vilanova <vilanova@ac.upc.edu>


> ---
>  include/qom/cpu.h | 9 +++------
>  qom/cpu.c         | 8 --------
>  trace/control.c   | 9 ++++++++-
>  3 files changed, 11 insertions(+), 15 deletions(-)

> diff --git a/include/qom/cpu.h b/include/qom/cpu.h
> index 89ddb68..bc6e20f 100644
> --- a/include/qom/cpu.h
> +++ b/include/qom/cpu.h
> @@ -259,6 +259,7 @@ typedef void (*run_on_cpu_func)(CPUState *cpu, run_on_cpu_data data);
>  struct qemu_work_item;
 
>  #define CPU_UNSET_NUMA_NODE_ID -1
> +#define CPU_TRACE_DSTATE_MAX_EVENTS 32
 
>  /**
>   * CPUState:
> @@ -373,12 +374,8 @@ struct CPUState {
>      struct KVMState *kvm_state;
>      struct kvm_run *kvm_run;
 
> -    /*
> -     * Used for events with 'vcpu' and *without* the 'disabled' properties.
> -     * Dynamically allocated based on bitmap requried to hold up to
> -     * trace_get_vcpu_event_count() entries.
> -     */
> -    unsigned long *trace_dstate;
> +    /* Used for events with 'vcpu' and *without* the 'disabled' properties */
> +    DECLARE_BITMAP(trace_dstate, CPU_TRACE_DSTATE_MAX_EVENTS);
 
>      /* TODO Move common fields from CPUArchState here. */
>      int cpu_index; /* used by alpha TCG */
> diff --git a/qom/cpu.c b/qom/cpu.c
> index 5069876..69fbb9c 100644
> --- a/qom/cpu.c
> +++ b/qom/cpu.c
> @@ -382,7 +382,6 @@ static void cpu_common_unrealizefn(DeviceState *dev, Error **errp)
 
>  static void cpu_common_initfn(Object *obj)
>  {
> -    uint32_t count;
>      CPUState *cpu = CPU(obj);
>      CPUClass *cc = CPU_GET_CLASS(obj);
 
> @@ -397,18 +396,11 @@ static void cpu_common_initfn(Object *obj)
>      QTAILQ_INIT(&cpu->breakpoints);
>      QTAILQ_INIT(&cpu->watchpoints);
 
> -    count = trace_get_vcpu_event_count();
> -    if (count) {
> -        cpu->trace_dstate = bitmap_new(count);
> -    }
> -
>      cpu_exec_initfn(cpu);
>  }
 
>  static void cpu_common_finalize(Object *obj)
>  {
> -    CPUState *cpu = CPU(obj);
> -    g_free(cpu->trace_dstate);
>  }
 
>  static int64_t cpu_common_get_arch_id(CPUState *cpu)
> diff --git a/trace/control.c b/trace/control.c
> index 9b157b0..83740aa 100644
> --- a/trace/control.c
> +++ b/trace/control.c
> @@ -65,8 +65,15 @@ void trace_event_register_group(TraceEvent **events)
>      size_t i;
>      for (i = 0; events[i] != NULL; i++) {
>          events[i]->id = next_id++;
> -        if (events[i]->vcpu_id != TRACE_VCPU_EVENT_NONE) {
> +        if (events[i]->vcpu_id == TRACE_VCPU_EVENT_NONE) {
> +            continue;
> +        }
> +
> +        if (likely(next_vcpu_id < CPU_TRACE_DSTATE_MAX_EVENTS)) {
>              events[i]->vcpu_id = next_vcpu_id++;
> +        } else {
> +            error_report("WARNING: too many vcpu trace events; dropping '%s'",
> +                         events[i]->name);
>          }
>      }
>      event_groups = g_renew(TraceEventGroup, event_groups, nevent_groups + 1);
> -- 
> 2.7.4
Lluís Vilanova June 25, 2017, 9:41 a.m. UTC | #2
Lluís Vilanova writes:

> Emilio G Cota writes:
>> There's little point in dynamically allocating the bitmap if we
>> know at compile-time the max number of events we want to support.
>> Thus, make room in the struct for the bitmap, which will make things
>> easier later: this paves the way for upcoming changes, in which
>> we'll use a u32 to fully capture cpu->trace_dstate.

>> This change also increases performance by saving a dereference and
>> improving locality--note that this is important since upcoming work
>> makes reading this bitmap fairly common.

>> Signed-off-by: Emilio G. Cota <cota@braap.org>

> Reviewed-by: Lluís Vilanova <vilanova@ac.upc.edu>

BTW, I think this partially undoes Daniel's changes in
b7d48952c375842bd669460fd8384d90cc12286c.

You should check with him (CC'ed).

Lluis


>> ---
>> include/qom/cpu.h | 9 +++------
>> qom/cpu.c         | 8 --------
>> trace/control.c   | 9 ++++++++-
>> 3 files changed, 11 insertions(+), 15 deletions(-)

>> diff --git a/include/qom/cpu.h b/include/qom/cpu.h
>> index 89ddb68..bc6e20f 100644
>> --- a/include/qom/cpu.h
>> +++ b/include/qom/cpu.h
>> @@ -259,6 +259,7 @@ typedef void (*run_on_cpu_func)(CPUState *cpu, run_on_cpu_data data);
>> struct qemu_work_item;
 
>> #define CPU_UNSET_NUMA_NODE_ID -1
>> +#define CPU_TRACE_DSTATE_MAX_EVENTS 32
 
>> /**
>> * CPUState:
>> @@ -373,12 +374,8 @@ struct CPUState {
>> struct KVMState *kvm_state;
>> struct kvm_run *kvm_run;
 
>> -    /*
>> -     * Used for events with 'vcpu' and *without* the 'disabled' properties.
>> -     * Dynamically allocated based on bitmap requried to hold up to
>> -     * trace_get_vcpu_event_count() entries.
>> -     */
>> -    unsigned long *trace_dstate;
>> +    /* Used for events with 'vcpu' and *without* the 'disabled' properties */
>> +    DECLARE_BITMAP(trace_dstate, CPU_TRACE_DSTATE_MAX_EVENTS);
 
>> /* TODO Move common fields from CPUArchState here. */
>> int cpu_index; /* used by alpha TCG */
>> diff --git a/qom/cpu.c b/qom/cpu.c
>> index 5069876..69fbb9c 100644
>> --- a/qom/cpu.c
>> +++ b/qom/cpu.c
>> @@ -382,7 +382,6 @@ static void cpu_common_unrealizefn(DeviceState *dev, Error **errp)
 
>> static void cpu_common_initfn(Object *obj)
>> {
>> -    uint32_t count;
>> CPUState *cpu = CPU(obj);
>> CPUClass *cc = CPU_GET_CLASS(obj);
 
>> @@ -397,18 +396,11 @@ static void cpu_common_initfn(Object *obj)
>> QTAILQ_INIT(&cpu->breakpoints);
>> QTAILQ_INIT(&cpu->watchpoints);
 
>> -    count = trace_get_vcpu_event_count();
>> -    if (count) {
>> -        cpu->trace_dstate = bitmap_new(count);
>> -    }
>> -
>> cpu_exec_initfn(cpu);
>> }
 
>> static void cpu_common_finalize(Object *obj)
>> {
>> -    CPUState *cpu = CPU(obj);
>> -    g_free(cpu->trace_dstate);
>> }
 
>> static int64_t cpu_common_get_arch_id(CPUState *cpu)
>> diff --git a/trace/control.c b/trace/control.c
>> index 9b157b0..83740aa 100644
>> --- a/trace/control.c
>> +++ b/trace/control.c
>> @@ -65,8 +65,15 @@ void trace_event_register_group(TraceEvent **events)
>> size_t i;
>> for (i = 0; events[i] != NULL; i++) {
>> events[i]->id = next_id++;
>> -        if (events[i]->vcpu_id != TRACE_VCPU_EVENT_NONE) {
>> +        if (events[i]->vcpu_id == TRACE_VCPU_EVENT_NONE) {
>> +            continue;
>> +        }
>> +
>> +        if (likely(next_vcpu_id < CPU_TRACE_DSTATE_MAX_EVENTS)) {
>> events[i]->vcpu_id = next_vcpu_id++;
>> +        } else {
>> +            error_report("WARNING: too many vcpu trace events; dropping '%s'",
>> +                         events[i]->name);
>> }
>> }
>> event_groups = g_renew(TraceEventGroup, event_groups, nevent_groups + 1);
>> -- 
>> 2.7.4
Daniel P. Berrangé June 26, 2017, 8:26 a.m. UTC | #3
On Sun, Jun 25, 2017 at 12:41:57PM +0300, Lluís Vilanova wrote:
> Lluís Vilanova writes:
> 
> > Emilio G Cota writes:
> >> There's little point in dynamically allocating the bitmap if we
> >> know at compile-time the max number of events we want to support.
> >> Thus, make room in the struct for the bitmap, which will make things
> >> easier later: this paves the way for upcoming changes, in which
> >> we'll use a u32 to fully capture cpu->trace_dstate.
> 
> >> This change also increases performance by saving a dereference and
> >> improving locality--note that this is important since upcoming work
> >> makes reading this bitmap fairly common.
> 
> >> Signed-off-by: Emilio G. Cota <cota@braap.org>
> 
> > Reviewed-by: Lluís Vilanova <vilanova@ac.upc.edu>
> 
> BTW, I think this partially undoes Daniel's changes in
> b7d48952c375842bd669460fd8384d90cc12286c.
> 
> You should check with him (CC'ed).

That's ok - I only made those changes in order to remove the reliance on
the generated max vcpu event ID counter. Choosing to hardcode a fixed
limit on the number of vcpu events instead is a fine alternative.

> 
> Lluis
> 
> 
> >> ---
> >> include/qom/cpu.h | 9 +++------
> >> qom/cpu.c         | 8 --------
> >> trace/control.c   | 9 ++++++++-
> >> 3 files changed, 11 insertions(+), 15 deletions(-)
> 
> >> diff --git a/include/qom/cpu.h b/include/qom/cpu.h
> >> index 89ddb68..bc6e20f 100644
> >> --- a/include/qom/cpu.h
> >> +++ b/include/qom/cpu.h
> >> @@ -259,6 +259,7 @@ typedef void (*run_on_cpu_func)(CPUState *cpu, run_on_cpu_data data);
> >> struct qemu_work_item;
>  
> >> #define CPU_UNSET_NUMA_NODE_ID -1
> >> +#define CPU_TRACE_DSTATE_MAX_EVENTS 32
>  
> >> /**
> >> * CPUState:
> >> @@ -373,12 +374,8 @@ struct CPUState {
> >> struct KVMState *kvm_state;
> >> struct kvm_run *kvm_run;
>  
> >> -    /*
> >> -     * Used for events with 'vcpu' and *without* the 'disabled' properties.
> >> -     * Dynamically allocated based on bitmap requried to hold up to
> >> -     * trace_get_vcpu_event_count() entries.
> >> -     */
> >> -    unsigned long *trace_dstate;
> >> +    /* Used for events with 'vcpu' and *without* the 'disabled' properties */
> >> +    DECLARE_BITMAP(trace_dstate, CPU_TRACE_DSTATE_MAX_EVENTS);
>  
> >> /* TODO Move common fields from CPUArchState here. */
> >> int cpu_index; /* used by alpha TCG */
> >> diff --git a/qom/cpu.c b/qom/cpu.c
> >> index 5069876..69fbb9c 100644
> >> --- a/qom/cpu.c
> >> +++ b/qom/cpu.c
> >> @@ -382,7 +382,6 @@ static void cpu_common_unrealizefn(DeviceState *dev, Error **errp)
>  
> >> static void cpu_common_initfn(Object *obj)
> >> {
> >> -    uint32_t count;
> >> CPUState *cpu = CPU(obj);
> >> CPUClass *cc = CPU_GET_CLASS(obj);
>  
> >> @@ -397,18 +396,11 @@ static void cpu_common_initfn(Object *obj)
> >> QTAILQ_INIT(&cpu->breakpoints);
> >> QTAILQ_INIT(&cpu->watchpoints);
>  
> >> -    count = trace_get_vcpu_event_count();
> >> -    if (count) {
> >> -        cpu->trace_dstate = bitmap_new(count);
> >> -    }
> >> -
> >> cpu_exec_initfn(cpu);
> >> }
>  
> >> static void cpu_common_finalize(Object *obj)
> >> {
> >> -    CPUState *cpu = CPU(obj);
> >> -    g_free(cpu->trace_dstate);
> >> }
>  
> >> static int64_t cpu_common_get_arch_id(CPUState *cpu)
> >> diff --git a/trace/control.c b/trace/control.c
> >> index 9b157b0..83740aa 100644
> >> --- a/trace/control.c
> >> +++ b/trace/control.c
> >> @@ -65,8 +65,15 @@ void trace_event_register_group(TraceEvent **events)
> >> size_t i;
> >> for (i = 0; events[i] != NULL; i++) {
> >> events[i]->id = next_id++;
> >> -        if (events[i]->vcpu_id != TRACE_VCPU_EVENT_NONE) {
> >> +        if (events[i]->vcpu_id == TRACE_VCPU_EVENT_NONE) {
> >> +            continue;
> >> +        }
> >> +
> >> +        if (likely(next_vcpu_id < CPU_TRACE_DSTATE_MAX_EVENTS)) {
> >> events[i]->vcpu_id = next_vcpu_id++;
> >> +        } else {
> >> +            error_report("WARNING: too many vcpu trace events; dropping '%s'",
> >> +                         events[i]->name);
> >> }

This should be an abort IMHO, as it would be considered a bug to have
added more than 32 vcpu events.

I'd also suggest that the top-level 'trace-events' file get a comment
added to the effect that we only support 32 vcpu events right now.

Regards,
Daniel
diff mbox

Patch

diff --git a/include/qom/cpu.h b/include/qom/cpu.h
index 89ddb68..bc6e20f 100644
--- a/include/qom/cpu.h
+++ b/include/qom/cpu.h
@@ -259,6 +259,7 @@  typedef void (*run_on_cpu_func)(CPUState *cpu, run_on_cpu_data data);
 struct qemu_work_item;
 
 #define CPU_UNSET_NUMA_NODE_ID -1
+#define CPU_TRACE_DSTATE_MAX_EVENTS 32
 
 /**
  * CPUState:
@@ -373,12 +374,8 @@  struct CPUState {
     struct KVMState *kvm_state;
     struct kvm_run *kvm_run;
 
-    /*
-     * Used for events with 'vcpu' and *without* the 'disabled' properties.
-     * Dynamically allocated based on bitmap requried to hold up to
-     * trace_get_vcpu_event_count() entries.
-     */
-    unsigned long *trace_dstate;
+    /* Used for events with 'vcpu' and *without* the 'disabled' properties */
+    DECLARE_BITMAP(trace_dstate, CPU_TRACE_DSTATE_MAX_EVENTS);
 
     /* TODO Move common fields from CPUArchState here. */
     int cpu_index; /* used by alpha TCG */
diff --git a/qom/cpu.c b/qom/cpu.c
index 5069876..69fbb9c 100644
--- a/qom/cpu.c
+++ b/qom/cpu.c
@@ -382,7 +382,6 @@  static void cpu_common_unrealizefn(DeviceState *dev, Error **errp)
 
 static void cpu_common_initfn(Object *obj)
 {
-    uint32_t count;
     CPUState *cpu = CPU(obj);
     CPUClass *cc = CPU_GET_CLASS(obj);
 
@@ -397,18 +396,11 @@  static void cpu_common_initfn(Object *obj)
     QTAILQ_INIT(&cpu->breakpoints);
     QTAILQ_INIT(&cpu->watchpoints);
 
-    count = trace_get_vcpu_event_count();
-    if (count) {
-        cpu->trace_dstate = bitmap_new(count);
-    }
-
     cpu_exec_initfn(cpu);
 }
 
 static void cpu_common_finalize(Object *obj)
 {
-    CPUState *cpu = CPU(obj);
-    g_free(cpu->trace_dstate);
 }
 
 static int64_t cpu_common_get_arch_id(CPUState *cpu)
diff --git a/trace/control.c b/trace/control.c
index 9b157b0..83740aa 100644
--- a/trace/control.c
+++ b/trace/control.c
@@ -65,8 +65,15 @@  void trace_event_register_group(TraceEvent **events)
     size_t i;
     for (i = 0; events[i] != NULL; i++) {
         events[i]->id = next_id++;
-        if (events[i]->vcpu_id != TRACE_VCPU_EVENT_NONE) {
+        if (events[i]->vcpu_id == TRACE_VCPU_EVENT_NONE) {
+            continue;
+        }
+
+        if (likely(next_vcpu_id < CPU_TRACE_DSTATE_MAX_EVENTS)) {
             events[i]->vcpu_id = next_vcpu_id++;
+        } else {
+            error_report("WARNING: too many vcpu trace events; dropping '%s'",
+                         events[i]->name);
         }
     }
     event_groups = g_renew(TraceEventGroup, event_groups, nevent_groups + 1);