diff mbox series

[v2,3/5] ACPI/PPTT: Modify node flag detection to find last IDENTICAL

Message ID 20190426220309.55654-4-jeremy.linton@arm.com (mailing list archive)
State Superseded, archived
Headers show
Series arm64: SPE ACPI enablement | expand

Commit Message

Jeremy Linton April 26, 2019, 10:03 p.m. UTC
The ACPI specification implies that the IDENTICAL flag should be
set on all non leaf nodes where the children are identical.
This means that we need to be searching for the last node with
the identical flag set rather than the first one.

To achieve this with the existing code we need to pass a
function through the tree traversal logic so we can check
the next node to assure that IDENTICAL isn't set before returning
a node with IDENTICAL set.

Signed-off-by: Jeremy Linton <jeremy.linton@arm.com>
---
 drivers/acpi/pptt.c | 62 +++++++++++++++++++++++++++++++++++----------
 1 file changed, 48 insertions(+), 14 deletions(-)

Comments

Rafael J. Wysocki April 29, 2019, 8:59 a.m. UTC | #1
On Sat, Apr 27, 2019 at 12:03 AM Jeremy Linton <jeremy.linton@arm.com> wrote:
>
> The ACPI specification implies that the IDENTICAL flag should be
> set on all non leaf nodes where the children are identical.
> This means that we need to be searching for the last node with
> the identical flag set rather than the first one.
>
> To achieve this with the existing code we need to pass a
> function through the tree traversal logic so we can check
> the next node to assure that IDENTICAL isn't set before returning
> a node with IDENTICAL set.
>
> Signed-off-by: Jeremy Linton <jeremy.linton@arm.com>
> ---
>  drivers/acpi/pptt.c | 62 +++++++++++++++++++++++++++++++++++----------
>  1 file changed, 48 insertions(+), 14 deletions(-)
>
> diff --git a/drivers/acpi/pptt.c b/drivers/acpi/pptt.c
> index 1865515297ca..39f660d8be0a 100644
> --- a/drivers/acpi/pptt.c
> +++ b/drivers/acpi/pptt.c
> @@ -432,17 +432,51 @@ static void cache_setup_acpi_cpu(struct acpi_table_header *table,
>         }
>  }
>
> +
> +typedef bool (*node_check)(struct acpi_table_header *table_hdr,
> +                          struct acpi_pptt_processor *cpu);

I would just use a function pointer with the entire arg list in the
function header(s).  Using this just makes things harder to follow
IMO.

> +static bool flag_package(struct acpi_table_header *table_hdr,
> +                        struct acpi_pptt_processor *cpu)
> +{
> +       return cpu->flags & ACPI_PPTT_PHYSICAL_PACKAGE;
> +}
> +
> +static bool flag_identical(struct acpi_table_header *table_hdr,
> +                          struct acpi_pptt_processor *cpu)
> +{
> +       struct acpi_pptt_processor *next;
> +
> +       /* heterogeneous machines must use PPTT revision > 1 */
> +       if (table_hdr->revision < 2)
> +               return false;
> +
> +       /* Locate the last node in the tree with IDENTICAL set */
> +       if (cpu->flags & ACPI_PPTT_ACPI_IDENTICAL) {
> +               next = fetch_pptt_node(table_hdr, cpu->parent);
> +               if (!(next && next->flags & ACPI_PPTT_ACPI_IDENTICAL))
> +                       return true;
> +       }
> +
> +       return false;
> +}
> +
> +static bool flag_none(struct acpi_table_header *table_hdr,
> +                     struct acpi_pptt_processor *cpu)
> +{
> +       return false;
> +}
> +
>  /* Passing level values greater than this will result in search termination */
>  #define PPTT_ABORT_PACKAGE 0xFF
>
> -static struct acpi_pptt_processor *acpi_find_processor_package_id(struct acpi_table_header *table_hdr,
> -                                                                 struct acpi_pptt_processor *cpu,
> -                                                                 int level, int flag)
> +static struct acpi_pptt_processor *acpi_find_processor_tag_id(struct acpi_table_header *table_hdr,
> +                                                             struct acpi_pptt_processor *cpu,
> +                                                             int level, node_check chk)
>  {
>         struct acpi_pptt_processor *prev_node;
>
>         while (cpu && level) {
> -               if (cpu->flags & flag)
> +               if (chk(table_hdr, cpu))
>                         break;
>                 pr_debug("level %d\n", level);
>                 prev_node = fetch_pptt_node(table_hdr, cpu->parent);
> @@ -473,15 +507,15 @@ static void acpi_pptt_warn_missing(void)
>   * Return: Unique value, or -ENOENT if unable to locate CPU
>   */
>  static int topology_get_acpi_cpu_tag(struct acpi_table_header *table,
> -                                    unsigned int cpu, int level, int flag)
> +                                    unsigned int cpu, int level, node_check chk)
>  {
>         struct acpi_pptt_processor *cpu_node;
>         u32 acpi_cpu_id = get_acpi_id_for_cpu(cpu);
>
>         cpu_node = acpi_find_processor_node(table, acpi_cpu_id);
>         if (cpu_node) {
> -               cpu_node = acpi_find_processor_package_id(table, cpu_node,
> -                                                         level, flag);
> +               cpu_node = acpi_find_processor_tag_id(table, cpu_node,
> +                                                         level, chk);
>                 /*
>                  * As per specification if the processor structure represents
>                  * an actual processor, then ACPI processor ID must be valid.
> @@ -498,7 +532,7 @@ static int topology_get_acpi_cpu_tag(struct acpi_table_header *table,
>         return -ENOENT;
>  }
>
> -static int find_acpi_cpu_topology_tag(unsigned int cpu, int level, int flag)
> +static int find_acpi_cpu_topology_tag(unsigned int cpu, int level, node_check chk)
>  {
>         struct acpi_table_header *table;
>         acpi_status status;
> @@ -509,7 +543,7 @@ static int find_acpi_cpu_topology_tag(unsigned int cpu, int level, int flag)
>                 acpi_pptt_warn_missing();
>                 return -ENOENT;
>         }
> -       retval = topology_get_acpi_cpu_tag(table, cpu, level, flag);
> +       retval = topology_get_acpi_cpu_tag(table, cpu, level, chk);
>         pr_debug("Topology Setup ACPI CPU %d, level %d ret = %d\n",
>                  cpu, level, retval);
>         acpi_put_table(table);
> @@ -601,7 +635,7 @@ int cache_setup_acpi(unsigned int cpu)
>   */
>  int find_acpi_cpu_topology(unsigned int cpu, int level)
>  {
> -       return find_acpi_cpu_topology_tag(cpu, level, 0);
> +       return find_acpi_cpu_topology_tag(cpu, level, flag_none);
>  }
>
>  /**
> @@ -658,7 +692,7 @@ int find_acpi_cpu_cache_topology(unsigned int cpu, int level)
>  int find_acpi_cpu_topology_package(unsigned int cpu)
>  {
>         return find_acpi_cpu_topology_tag(cpu, PPTT_ABORT_PACKAGE,
> -                                         ACPI_PPTT_PHYSICAL_PACKAGE);
> +                                         flag_package);
>  }
>
>  /**
> @@ -670,8 +704,8 @@ int find_acpi_cpu_topology_package(unsigned int cpu)
>   *
>   * The returned tag can be used to group peers with identical implementation.
>   *
> - * The search terminates when a level is found with the identical implementation
> - * flag set or we reach a root node.
> + * The search terminates when a level is found without the identical
> + * implementation flag set following a node with it set, or we reach the root.
>   *
>   * Due to limitations in the PPTT data structure, there may be rare situations
>   * where two cores in a heterogeneous machine may be identical, but won't have
> @@ -684,5 +718,5 @@ int find_acpi_cpu_topology_package(unsigned int cpu)
>  int find_acpi_cpu_topology_hetero_id(unsigned int cpu)
>  {
>         return find_acpi_cpu_topology_tag(cpu, PPTT_ABORT_PACKAGE,
> -                                         ACPI_PPTT_ACPI_IDENTICAL);
> +                                         flag_identical);
>  }
> --

I'm not a super big fan of passing function pointers in general.

I kind of see how this works for you, but why exactly the flag
(ACPI_PPTT_ACPI_IDENTICAL in this case) is not sufficient to
distinguish between the cases?
Jeremy Linton May 1, 2019, 4:23 p.m. UTC | #2
Hi,

On 4/29/19 3:59 AM, Rafael J. Wysocki wrote:
> On Sat, Apr 27, 2019 at 12:03 AM Jeremy Linton <jeremy.linton@arm.com> wrote:
>>
>> The ACPI specification implies that the IDENTICAL flag should be
>> set on all non leaf nodes where the children are identical.
>> This means that we need to be searching for the last node with
>> the identical flag set rather than the first one.
>>
>> To achieve this with the existing code we need to pass a
>> function through the tree traversal logic so we can check
>> the next node to assure that IDENTICAL isn't set before returning
>> a node with IDENTICAL set.
>>
>> Signed-off-by: Jeremy Linton <jeremy.linton@arm.com>
>> ---
>>   drivers/acpi/pptt.c | 62 +++++++++++++++++++++++++++++++++++----------
>>   1 file changed, 48 insertions(+), 14 deletions(-)
>>
>> diff --git a/drivers/acpi/pptt.c b/drivers/acpi/pptt.c
>> index 1865515297ca..39f660d8be0a 100644
>> --- a/drivers/acpi/pptt.c
>> +++ b/drivers/acpi/pptt.c
>> @@ -432,17 +432,51 @@ static void cache_setup_acpi_cpu(struct acpi_table_header *table,
>>          }
>>   }
>>
>> +
>> +typedef bool (*node_check)(struct acpi_table_header *table_hdr,
>> +                          struct acpi_pptt_processor *cpu);
> 
> I would just use a function pointer with the entire arg list in the
> function header(s).  Using this just makes things harder to follow
> IMO.

Ok... that makes the headers a bit big, maybe there is a better way.


> 
>> +static bool flag_package(struct acpi_table_header *table_hdr,
>> +                        struct acpi_pptt_processor *cpu)
>> +{
>> +       return cpu->flags & ACPI_PPTT_PHYSICAL_PACKAGE;
>> +}
>> +
>> +static bool flag_identical(struct acpi_table_header *table_hdr,
>> +                          struct acpi_pptt_processor *cpu)
>> +{
>> +       struct acpi_pptt_processor *next;
>> +
>> +       /* heterogeneous machines must use PPTT revision > 1 */
>> +       if (table_hdr->revision < 2)
>> +               return false;
>> +
>> +       /* Locate the last node in the tree with IDENTICAL set */
>> +       if (cpu->flags & ACPI_PPTT_ACPI_IDENTICAL) {
>> +               next = fetch_pptt_node(table_hdr, cpu->parent);
>> +               if (!(next && next->flags & ACPI_PPTT_ACPI_IDENTICAL))
>> +                       return true;
>> +       }
>> +
>> +       return false;
>> +}
>> +
>> +static bool flag_none(struct acpi_table_header *table_hdr,
>> +                     struct acpi_pptt_processor *cpu)
>> +{
>> +       return false;
>> +}
>> +
>>   /* Passing level values greater than this will result in search termination */
>>   #define PPTT_ABORT_PACKAGE 0xFF
>>
>> -static struct acpi_pptt_processor *acpi_find_processor_package_id(struct acpi_table_header *table_hdr,
>> -                                                                 struct acpi_pptt_processor *cpu,
>> -                                                                 int level, int flag)
>> +static struct acpi_pptt_processor *acpi_find_processor_tag_id(struct acpi_table_header *table_hdr,
>> +                                                             struct acpi_pptt_processor *cpu,
>> +                                                             int level, node_check chk)
>>   {
>>          struct acpi_pptt_processor *prev_node;
>>
>>          while (cpu && level) {
>> -               if (cpu->flags & flag)
>> +               if (chk(table_hdr, cpu))
>>                          break;
>>                  pr_debug("level %d\n", level);
>>                  prev_node = fetch_pptt_node(table_hdr, cpu->parent);
>> @@ -473,15 +507,15 @@ static void acpi_pptt_warn_missing(void)
>>    * Return: Unique value, or -ENOENT if unable to locate CPU
>>    */
>>   static int topology_get_acpi_cpu_tag(struct acpi_table_header *table,
>> -                                    unsigned int cpu, int level, int flag)
>> +                                    unsigned int cpu, int level, node_check chk)
>>   {
>>          struct acpi_pptt_processor *cpu_node;
>>          u32 acpi_cpu_id = get_acpi_id_for_cpu(cpu);
>>
>>          cpu_node = acpi_find_processor_node(table, acpi_cpu_id);
>>          if (cpu_node) {
>> -               cpu_node = acpi_find_processor_package_id(table, cpu_node,
>> -                                                         level, flag);
>> +               cpu_node = acpi_find_processor_tag_id(table, cpu_node,
>> +                                                         level, chk);
>>                  /*
>>                   * As per specification if the processor structure represents
>>                   * an actual processor, then ACPI processor ID must be valid.
>> @@ -498,7 +532,7 @@ static int topology_get_acpi_cpu_tag(struct acpi_table_header *table,
>>          return -ENOENT;
>>   }
>>
>> -static int find_acpi_cpu_topology_tag(unsigned int cpu, int level, int flag)
>> +static int find_acpi_cpu_topology_tag(unsigned int cpu, int level, node_check chk)
>>   {
>>          struct acpi_table_header *table;
>>          acpi_status status;
>> @@ -509,7 +543,7 @@ static int find_acpi_cpu_topology_tag(unsigned int cpu, int level, int flag)
>>                  acpi_pptt_warn_missing();
>>                  return -ENOENT;
>>          }
>> -       retval = topology_get_acpi_cpu_tag(table, cpu, level, flag);
>> +       retval = topology_get_acpi_cpu_tag(table, cpu, level, chk);
>>          pr_debug("Topology Setup ACPI CPU %d, level %d ret = %d\n",
>>                   cpu, level, retval);
>>          acpi_put_table(table);
>> @@ -601,7 +635,7 @@ int cache_setup_acpi(unsigned int cpu)
>>    */
>>   int find_acpi_cpu_topology(unsigned int cpu, int level)
>>   {
>> -       return find_acpi_cpu_topology_tag(cpu, level, 0);
>> +       return find_acpi_cpu_topology_tag(cpu, level, flag_none);
>>   }
>>
>>   /**
>> @@ -658,7 +692,7 @@ int find_acpi_cpu_cache_topology(unsigned int cpu, int level)
>>   int find_acpi_cpu_topology_package(unsigned int cpu)
>>   {
>>          return find_acpi_cpu_topology_tag(cpu, PPTT_ABORT_PACKAGE,
>> -                                         ACPI_PPTT_PHYSICAL_PACKAGE);
>> +                                         flag_package);
>>   }
>>
>>   /**
>> @@ -670,8 +704,8 @@ int find_acpi_cpu_topology_package(unsigned int cpu)
>>    *
>>    * The returned tag can be used to group peers with identical implementation.
>>    *
>> - * The search terminates when a level is found with the identical implementation
>> - * flag set or we reach a root node.
>> + * The search terminates when a level is found without the identical
>> + * implementation flag set following a node with it set, or we reach the root.
>>    *
>>    * Due to limitations in the PPTT data structure, there may be rare situations
>>    * where two cores in a heterogeneous machine may be identical, but won't have
>> @@ -684,5 +718,5 @@ int find_acpi_cpu_topology_package(unsigned int cpu)
>>   int find_acpi_cpu_topology_hetero_id(unsigned int cpu)
>>   {
>>          return find_acpi_cpu_topology_tag(cpu, PPTT_ABORT_PACKAGE,
>> -                                         ACPI_PPTT_ACPI_IDENTICAL);
>> +                                         flag_identical);
>>   }
>> --
> 
> I'm not a super big fan of passing function pointers in general.

Me neither, really, but it was fairly concise here. We could just switch
on the flag and open-code the IDENTICAL special case in
acpi_find_processor_tag_id(). I wouldn't expect there to be too many
special-case flags like this, so that may be a better solution.

OTOH, I'm not even sure this patch is the right thing to do; it depends
on how you read the intention of the spec. That is why I haven't merged
it with 2/5. AFAIK, the one machine that was setting the IDENTICAL
flag everywhere had another problem which is forcing them to update the
table, and they appear to have also corrected the table to only set it
on the final identical node.

So, maybe I should drop this piece of the set and wait for someone to 
complain or the spec to be clarified?

> 
> I kind of see how this works for you, but why exactly the flag
> (ACPI_PPTT_ACPI_IDENTICAL in this case) is not sufficient to
> distinguish between the cases?
> 

I guess I'm not clear on what you're asking here; maybe just a
clarification of why this patch is needed vs. just 2/5? Under that
assumption:

The spec reads "A value of 1 indicates that all children processors
share an identical implementation revision". So AFAIK the intention was
that it behaves like the Physical package flag, which has an additional
clarification which reads "Each valid processor must belong to exactly
one package". Minus that blurb, it seems a valid interpretation is that
a homogeneous machine can have the IDENTICAL flag set on every non-leaf
node. Since we are traversing the tree from the leaf to the root
(because that is the way the tree is structured), we need to find the
last node along the traversal with the IDENTICAL flag set in order to
return the common node closest to the root. With just 2/5, we end up
returning the node closest to the leaf, which means processors which
share an IDENTICAL node won't necessarily have duplicate tags (which is
what we need).

If we can assume that there is only a single IDENTICAL flag along the 
path between any given leaf and the root, this patch would not be necessary.
diff mbox series

Patch

diff --git a/drivers/acpi/pptt.c b/drivers/acpi/pptt.c
index 1865515297ca..39f660d8be0a 100644
--- a/drivers/acpi/pptt.c
+++ b/drivers/acpi/pptt.c
@@ -432,17 +432,51 @@  static void cache_setup_acpi_cpu(struct acpi_table_header *table,
 	}
 }
 
+
+typedef bool (*node_check)(struct acpi_table_header *table_hdr,
+			   struct acpi_pptt_processor *cpu);
+static bool flag_package(struct acpi_table_header *table_hdr,
+			 struct acpi_pptt_processor *cpu)
+{
+	return cpu->flags & ACPI_PPTT_PHYSICAL_PACKAGE;
+}
+
+static bool flag_identical(struct acpi_table_header *table_hdr,
+			   struct acpi_pptt_processor *cpu)
+{
+	struct acpi_pptt_processor *next;
+
+	/* heterogeneous machines must use PPTT revision > 1 */
+	if (table_hdr->revision < 2)
+		return false;
+
+	/* Locate the last node in the tree with IDENTICAL set */
+	if (cpu->flags & ACPI_PPTT_ACPI_IDENTICAL) {
+		next = fetch_pptt_node(table_hdr, cpu->parent);
+		if (!(next && next->flags & ACPI_PPTT_ACPI_IDENTICAL))
+			return true;
+	}
+
+	return false;
+}
+
+static bool flag_none(struct acpi_table_header *table_hdr,
+		      struct acpi_pptt_processor *cpu)
+{
+	return false;
+}
+
 /* Passing level values greater than this will result in search termination */
 #define PPTT_ABORT_PACKAGE 0xFF
 
-static struct acpi_pptt_processor *acpi_find_processor_package_id(struct acpi_table_header *table_hdr,
-								  struct acpi_pptt_processor *cpu,
-								  int level, int flag)
+static struct acpi_pptt_processor *acpi_find_processor_tag_id(struct acpi_table_header *table_hdr,
+							      struct acpi_pptt_processor *cpu,
+							      int level, node_check chk)
 {
 	struct acpi_pptt_processor *prev_node;
 
 	while (cpu && level) {
-		if (cpu->flags & flag)
+		if (chk(table_hdr, cpu))
 			break;
 		pr_debug("level %d\n", level);
 		prev_node = fetch_pptt_node(table_hdr, cpu->parent);
@@ -473,15 +507,15 @@  static void acpi_pptt_warn_missing(void)
  * Return: Unique value, or -ENOENT if unable to locate CPU
  */
 static int topology_get_acpi_cpu_tag(struct acpi_table_header *table,
-				     unsigned int cpu, int level, int flag)
+				     unsigned int cpu, int level, node_check chk)
 {
 	struct acpi_pptt_processor *cpu_node;
 	u32 acpi_cpu_id = get_acpi_id_for_cpu(cpu);
 
 	cpu_node = acpi_find_processor_node(table, acpi_cpu_id);
 	if (cpu_node) {
-		cpu_node = acpi_find_processor_package_id(table, cpu_node,
-							  level, flag);
+		cpu_node = acpi_find_processor_tag_id(table, cpu_node,
+							  level, chk);
 		/*
 		 * As per specification if the processor structure represents
 		 * an actual processor, then ACPI processor ID must be valid.
@@ -498,7 +532,7 @@  static int topology_get_acpi_cpu_tag(struct acpi_table_header *table,
 	return -ENOENT;
 }
 
-static int find_acpi_cpu_topology_tag(unsigned int cpu, int level, int flag)
+static int find_acpi_cpu_topology_tag(unsigned int cpu, int level, node_check chk)
 {
 	struct acpi_table_header *table;
 	acpi_status status;
@@ -509,7 +543,7 @@  static int find_acpi_cpu_topology_tag(unsigned int cpu, int level, int flag)
 		acpi_pptt_warn_missing();
 		return -ENOENT;
 	}
-	retval = topology_get_acpi_cpu_tag(table, cpu, level, flag);
+	retval = topology_get_acpi_cpu_tag(table, cpu, level, chk);
 	pr_debug("Topology Setup ACPI CPU %d, level %d ret = %d\n",
 		 cpu, level, retval);
 	acpi_put_table(table);
@@ -601,7 +635,7 @@  int cache_setup_acpi(unsigned int cpu)
  */
 int find_acpi_cpu_topology(unsigned int cpu, int level)
 {
-	return find_acpi_cpu_topology_tag(cpu, level, 0);
+	return find_acpi_cpu_topology_tag(cpu, level, flag_none);
 }
 
 /**
@@ -658,7 +692,7 @@  int find_acpi_cpu_cache_topology(unsigned int cpu, int level)
 int find_acpi_cpu_topology_package(unsigned int cpu)
 {
 	return find_acpi_cpu_topology_tag(cpu, PPTT_ABORT_PACKAGE,
-					  ACPI_PPTT_PHYSICAL_PACKAGE);
+					  flag_package);
 }
 
 /**
@@ -670,8 +704,8 @@  int find_acpi_cpu_topology_package(unsigned int cpu)
  *
  * The returned tag can be used to group peers with identical implementation.
  *
- * The search terminates when a level is found with the identical implementation
- * flag set or we reach a root node.
+ * The search terminates when a level is found without the identical
+ * implementation flag set following a node with it set, or we reach the root.
  *
  * Due to limitations in the PPTT data structure, there may be rare situations
  * where two cores in a heterogeneous machine may be identical, but won't have
@@ -684,5 +718,5 @@  int find_acpi_cpu_topology_package(unsigned int cpu)
 int find_acpi_cpu_topology_hetero_id(unsigned int cpu)
 {
 	return find_acpi_cpu_topology_tag(cpu, PPTT_ABORT_PACKAGE,
-					  ACPI_PPTT_ACPI_IDENTICAL);
+					  flag_identical);
 }