aboutsummaryrefslogtreecommitdiff
diff options
context:
space:
mode:
-rw-r--r--15.0.0/gentoo/32_all_genoutput-speedup.patch247
1 files changed, 0 insertions, 247 deletions
diff --git a/15.0.0/gentoo/32_all_genoutput-speedup.patch b/15.0.0/gentoo/32_all_genoutput-speedup.patch
deleted file mode 100644
index a379bf8..0000000
--- a/15.0.0/gentoo/32_all_genoutput-speedup.patch
+++ /dev/null
@@ -1,247 +0,0 @@
-https://inbox.sourceware.org/gcc-patches/20240814021909.37082-1-cooper.qu@linux.alibaba.com/
-
-From 23ea354ab6c1faf858120b65a0114c5d0bbeaf6e Mon Sep 17 00:00:00 2001
-Message-ID: <23ea354ab6c1faf858120b65a0114c5d0bbeaf6e.1723604026.git.sam@gentoo.org>
-From: Xianmiao Qu <cooper.qu@linux.alibaba.com>
-Date: Wed, 14 Aug 2024 10:19:09 +0800
-Subject: [PATCH] genoutput: Accelerate the place_operands function.
-
-With the increase in the number of modes and patterns for some
-backend architectures, the place_operands function becomes a
-bottleneck int the speed of genoutput, and may even become a
-bottleneck int the overall speed of building the GCC project.
-This patch aims to accelerate the place_operands function,
-the optimizations it includes are:
-1. Use a hash table to store operand information,
- improving the lookup time for the first operand.
-2. Move mode comparison to the beginning to avoid the scenarios of most strcmp.
-
-I tested the speed improvements for the following backends,
- Improvement Ratio
-x86_64 197.9%
-aarch64 954.5%
-riscv 2578.6%
-If the build machine is slow, then this improvement can save a lot of time.
-
-I tested the genoutput output for x86_64/aarch64/riscv backends,
-and there was no difference compared to before the optimization,
-so this shouldn't introduce any functional issues.
-
-gcc/
- * genoutput.cc (struct operand_data): Add member 'eq_next' to
- point to the next member with the same hash value in the
- hash table.
- (compare_operands): Move the comparison of the mode to the very
- beginning to accelerate the comparison of the two operands.
- (struct operand_data_hasher): New, a class that takes into account
- the necessary elements for comparing the equality of two operands
- in its hash value.
- (operand_data_hasher::hash): New.
- (operand_data_hasher::equal): New.
- (operand_datas): New, hash table of konwn pattern operands.
- (place_operands): Use a hash table instead of traversing the array
- to find the same operand.
- (main): Add initialization of the hash table 'operand_datas'.
----
- gcc/genoutput.cc | 111 +++++++++++++++++++++++++++++++++++++----------
- 1 file changed, 88 insertions(+), 23 deletions(-)
-
-diff --git a/gcc/genoutput.cc b/gcc/genoutput.cc
-index efd81766bb5b..16fd811b5dd5 100644
---- a/gcc/genoutput.cc
-+++ b/gcc/genoutput.cc
-@@ -91,6 +91,7 @@ along with GCC; see the file COPYING3. If not see
- #include "errors.h"
- #include "read-md.h"
- #include "gensupport.h"
-+#include "hash-table.h"
-
- /* No instruction can have more operands than this. Sorry for this
- arbitrary limit, but what machine will have an instruction with
-@@ -112,6 +113,8 @@ static int next_operand_number = 1;
- struct operand_data
- {
- struct operand_data *next;
-+ /* Point to the next member with the same hash value in the hash table. */
-+ struct operand_data *eq_next;
- int index;
- const char *predicate;
- const char *constraint;
-@@ -127,7 +130,7 @@ struct operand_data
-
- static struct operand_data null_operand =
- {
-- 0, 0, "", "", E_VOIDmode, 0, 0, 0, 0, 0
-+ 0, 0, 0, "", "", E_VOIDmode, 0, 0, 0, 0, 0
- };
-
- static struct operand_data *odata = &null_operand;
-@@ -174,8 +177,8 @@ static void output_operand_data (void);
- static void output_insn_data (void);
- static void output_get_insn_name (void);
- static void scan_operands (class data *, rtx, int, int);
--static int compare_operands (struct operand_data *,
-- struct operand_data *);
-+static int compare_operands (const struct operand_data *,
-+ const struct operand_data *);
- static void place_operands (class data *);
- static void process_template (class data *, const char *);
- static void validate_insn_alternatives (class data *);
-@@ -528,10 +531,18 @@ scan_operands (class data *d, rtx part, int this_address_p,
- /* Compare two operands for content equality. */
-
- static int
--compare_operands (struct operand_data *d0, struct operand_data *d1)
-+compare_operands (const struct operand_data *d0,
-+ const struct operand_data *d1)
- {
- const char *p0, *p1;
-
-+ /* On one hand, comparing strings for predicate and constraint
-+ is time-consuming, and on the other hand, the probability of
-+ different modes is relatively high. Therefore, checking the mode
-+ first can speed up the execution of the program. */
-+ if (d0->mode != d1->mode)
-+ return 0;
-+
- p0 = d0->predicate;
- if (!p0)
- p0 = "";
-@@ -550,9 +561,6 @@ compare_operands (struct operand_data *d0, struct operand_data *d1)
- if (strcmp (p0, p1) != 0)
- return 0;
-
-- if (d0->mode != d1->mode)
-- return 0;
--
- if (d0->strict_low != d1->strict_low)
- return 0;
-
-@@ -562,6 +570,46 @@ compare_operands (struct operand_data *d0, struct operand_data *d1)
- return 1;
- }
-
-+/* This is a class that takes into account the necessary elements for
-+ comparing the equality of two operands in its hash value. */
-+struct operand_data_hasher : nofree_ptr_hash <operand_data>
-+{
-+ static inline hashval_t hash (const operand_data *);
-+ static inline bool equal (const operand_data *, const operand_data *);
-+};
-+
-+hashval_t
-+operand_data_hasher::hash (const operand_data * op_info)
-+{
-+ inchash::hash h;
-+ const char *pred, *cons;
-+
-+ pred = op_info->predicate;
-+ if (!pred)
-+ pred = "";
-+ h.add (pred, strlen (pred) + 1);
-+
-+ cons = op_info->constraint;
-+ if (!cons)
-+ cons = "";
-+ h.add (cons, strlen (cons) + 1);
-+
-+ h.add_object (op_info->mode);
-+ h.add_object (op_info->strict_low);
-+ h.add_object (op_info->eliminable);
-+ return h.end ();
-+}
-+
-+bool
-+operand_data_hasher::equal (const operand_data * op_info1,
-+ const operand_data * op_info2)
-+{
-+ return compare_operands (op_info1, op_info2);
-+}
-+
-+/* Hashtable of konwn pattern operands. */
-+static hash_table<operand_data_hasher> *operand_datas;
-+
- /* Scan the list of operands we've already committed to output and either
- find a subsequence that is the same, or allocate a new one at the end. */
-
-@@ -569,6 +617,7 @@ static void
- place_operands (class data *d)
- {
- struct operand_data *od, *od2;
-+ struct operand_data **slot;
- int i;
-
- if (d->n_operands == 0)
-@@ -577,23 +626,24 @@ place_operands (class data *d)
- return;
- }
-
-+ od = operand_datas->find (&d->operand[0]);
- /* Brute force substring search. */
-- for (od = odata, i = 0; od; od = od->next, i = 0)
-- if (compare_operands (od, &d->operand[0]))
-- {
-- od2 = od->next;
-- i = 1;
-- while (1)
-- {
-- if (i == d->n_operands)
-- goto full_match;
-- if (od2 == NULL)
-- goto partial_match;
-- if (! compare_operands (od2, &d->operand[i]))
-- break;
-- ++i, od2 = od2->next;
-- }
-- }
-+ for (; od; od = od->eq_next)
-+ {
-+ od2 = od->next;
-+ i = 1;
-+ while (1)
-+ {
-+ if (i == d->n_operands)
-+ goto full_match;
-+ if (od2 == NULL)
-+ goto partial_match;
-+ if (! compare_operands (od2, &d->operand[i]))
-+ break;
-+ ++i, od2 = od2->next;
-+ }
-+ }
-+ i = 0;
-
- /* Either partial match at the end of the list, or no match. In either
- case, we tack on what operands are remaining to the end of the list. */
-@@ -605,6 +655,20 @@ place_operands (class data *d)
- *odata_end = od2;
- odata_end = &od2->next;
- od2->index = next_operand_number++;
-+ /* Insert the operand_data variable OD2 into the hash table.
-+ If a variable with the same hash value already exists in
-+ the hash table, insert the element at the end of the
-+ linked list connected through the eq_next member. */
-+ slot = operand_datas->find_slot (od2, INSERT);
-+ if (*slot)
-+ {
-+ struct operand_data *last = (struct operand_data *) *slot;
-+ while (last->eq_next)
-+ last = last->eq_next;
-+ last->eq_next = od2;
-+ }
-+ else
-+ *slot = od2;
- }
- *odata_end = NULL;
- return;
-@@ -1049,6 +1113,7 @@ main (int argc, const char **argv)
- progname = "genoutput";
-
- init_insn_for_nothing ();
-+ operand_datas = new hash_table<operand_data_hasher> (1024);
-
- if (!init_rtx_reader_args (argc, argv))
- return (FATAL_EXIT_CODE);
---
-2.45.2
-