Break up code for easier reg-alloc

Summary: Some enum code we encounter has a large live set of registers, which is detrimental to compilation speed (especially register allocation). We can reorder the code and stay observationally equivalent (in non-OOM situations). This also has the benefit of eliding many `move`s in the code and leads to a modest size improvement. Reviewed By: thezhangwei Differential Revision: D48279448 fbshipit-source-id: 6b39868300e423e94a7a6458e607737883cb9391
SeeYouOneDayDay · Aug 17, 2023 · f786d1b · f786d1b
1 parent bb3b9f5
commit f786d1b
Show file tree

Hide file tree

Showing 6 changed files with 585 additions and 1 deletion.
diff --git a/Makefile.am b/Makefile.am
@@ -420,7 +420,8 @@ libopt_la_SOURCES = \
 	opt/peephole/RedundantCheckCastRemover.cpp \
 	opt/print-kotlin-stats/PrintKotlinStats.cpp \
 	opt/print-members/PrintMembers.cpp \
-  opt/reachable-natives/ReachableNatives.cpp \
+	opt/reachable-natives/ReachableNatives.cpp \
+	opt/rearrange-enum-clinit/RearrangeEnumClinit.cpp \
 	opt/rebindrefs/ReBindRefs.cpp \
 	opt/regalloc/RegAlloc.cpp \
 	opt/regalloc-fast/FastRegAlloc.cpp \

diff --git a/Makefile.inc b/Makefile.inc
@@ -59,6 +59,7 @@ COMMON_INCLUDES = \
 	-I$(top_srcdir)/opt/peephole \
 	-I$(top_srcdir)/opt/print-members \
 	-I$(top_srcdir)/opt/print-kotlin-stats \
+	-I$(top_srcdir)/opt/rearrange-enum-clinit \
 	-I$(top_srcdir)/opt/rebindrefs \
 	-I$(top_srcdir)/opt/reduce-array-literals \
 	-I$(top_srcdir)/opt/reduce-boolean-branches \

diff --git a/opt/rearrange-enum-clinit/RearrangeEnumClinit.cpp b/opt/rearrange-enum-clinit/RearrangeEnumClinit.cpp
@@ -0,0 +1,315 @@
+/*
+ * Copyright (c) Meta Platforms, Inc. and affiliates.
+ *
+ * This source code is licensed under the MIT license found in the
+ * LICENSE file in the root directory of this source tree.
+ */
+
+#include "RearrangeEnumClinit.h"
+
+#include <atomic>
+
+#include "Debug.h"
+#include "DexUtil.h"
+#include "IRCode.h"
+#include "LiveRange.h"
+#include "MethodUtil.h"
+#include "PassManager.h"
+#include "ScopedCFG.h"
+#include "Show.h"
+#include "Walkers.h"
+
+namespace rearrange_enum_clinit {
+namespace {
+// Moves the $VALUES new-array to the block start and each aput-object earlier.
+struct Rearranger {
+  DexMethod* m; // Method being rewritten; its class identifies `$VALUES`.
+  cfg::ControlFlowGraph& cfg;
+  cfg::Block* b; // Entry block of `cfg`; all block edits below are made in it.
+
+  live_range::MoveAwareChains mac;
+  live_range::DefUseChains def_use; // Built once in the constructor.
+  live_range::UseDefChains use_def; // Built once in the constructor.
+  // Position in `b` of every MFLOW_OPCODE entry present at construction.
+  std::unordered_map<const IRInstruction*, IRList::iterator> insn_map;
+  // State filled in by run().
+  IRInstruction* array_sput{nullptr}; // The sput-object into `$VALUES`.
+  IRList::iterator array_new_array; // Definition of array_sput's source 0.
+  reg_t alloc_reg; // Register of the hoisted array; set on the first hoist.
+  // Builds the chains and the instruction index from the CFG's entry block.
+  Rearranger(DexMethod* m, cfg::ControlFlowGraph& cfg)
+      : m(m),
+        cfg(cfg),
+        b(cfg.entry_block()),
+        mac(cfg),
+        def_use(mac.get_def_use_chains()),
+        use_def(mac.get_use_def_chains()),
+        insn_map([](auto* block) {
+          std::unordered_map<const IRInstruction*, IRList::iterator> map;
+          for (auto it = block->begin(); it != block->end(); ++it) {
+            if (it->type == MFLOW_OPCODE) {
+              map.emplace(it->insn, it);
+            }
+          }
+          return map;
+        }(cfg.entry_block())) {}
+  // Returns the last sput-object in `b` that stores to this class's `$VALUES`.
+  IRInstruction* find_values_sput() {
+    for (auto it = b->rbegin(); it != b->rend(); ++it) { // Reverse scan.
+      if (it->type == MFLOW_OPCODE &&
+          it->insn->opcode() == OPCODE_SPUT_OBJECT) {
+        auto* f = it->insn->get_field();
+        if (f->get_class() == m->get_class() &&
+            f->get_name()->str() == "$VALUES") {
+          return it->insn;
+        }
+      }
+    }
+    not_reached(); // NOTE(review): no fallback if the sput is absent.
+  }
+  // Re-creates the array at the first opcode of `b`; returns its new register.
+  reg_t move_new_array_to_front() {
+    redex_assert(array_new_array != b->begin());
+    auto orig_new_array_size_it = std::prev(array_new_array);
+    redex_assert(orig_new_array_size_it->type == MFLOW_OPCODE);
+    redex_assert(orig_new_array_size_it->insn->opcode() == OPCODE_CONST);
+
+    // Just move to the front. This does not handle source blocks. Assume
+    // this is not important for now.
+    auto new_array_it = b->begin();
+    while (new_array_it->type != MFLOW_OPCODE) {
+      ++new_array_it;
+    }
+
+    // Should not be necessary, but for safety.
+    reg_t size_reg = cfg.allocate_temp();
+
+    reg_t new_reg = cfg.allocate_temp();
+    // Insert copies: the const, the new-array reading it, a pseudo move-result.
+    b->insert_before(
+        b->to_cfg_instruction_iterator(new_array_it),
+        {
+            (new IRInstruction(*orig_new_array_size_it->insn))
+                ->set_dest(size_reg),
+            (new IRInstruction(*array_new_array->insn))->set_src(0, size_reg),
+            (new IRInstruction(IOPCODE_MOVE_RESULT_PSEUDO_OBJECT))
+                ->set_dest(new_reg),
+        });
+    // Point the `$VALUES` store at the hoisted array.
+    array_sput->set_src(0, new_reg);
+
+    // Leave the size around in case it was referenced for something else.
+    // Will be cleaned up by shrinker.
+
+    return new_reg;
+  }
+  // Returns the unique definition reaching `use_insn`'s source `src_index`.
+  IRInstruction* find_singleton_def(IRInstruction* use_insn,
+                                    src_index_t src_index) {
+    auto it = use_def.find(live_range::Use{use_insn, src_index});
+    redex_assert(it != use_def.end());
+    redex_assert(it->second.size() == 1); // Exactly one reaching definition.
+    return *it->second.begin();
+  }
+  // For a new-instance: the constructor invoke on it, and that invoke's src 0.
+  std::pair<IRList::iterator, reg_t> find_move_point_new_instance(
+      IRInstruction* object_insn) {
+    auto it = def_use.find(object_insn);
+    redex_assert(it != def_use.end());
+    std::optional<reg_t> which_reg{};
+    std::optional<IRList::iterator> which_it{};
+    for (auto& obj_use : it->second) {
+      if (obj_use.src_index == 0 &&
+          opcode::is_an_invoke(obj_use.insn->opcode()) &&
+          method::is_constructor(obj_use.insn->get_method())) {
+        redex_assert(!which_reg); // At most one constructor call is expected.
+        which_reg = obj_use.insn->src(0);
+        which_it = insn_map.at(obj_use.insn);
+      }
+    }
+    redex_assert(which_reg); // At least one constructor call is required.
+    return std::make_pair(*which_it, *which_reg);
+  }
+  // Returns the entry after which the object is constructed, and its register.
+  std::pair<IRList::iterator, reg_t> find_move_point(
+      IRInstruction* object_insn) {
+    if (object_insn->opcode() != OPCODE_NEW_INSTANCE) {
+      auto object_it = insn_map.at(object_insn);
+      // If the value arrives via a move-result, step forward to that entry.
+      if (object_insn->has_move_result_any()) {
+        ++object_it;
+        while (object_it->type != MFLOW_OPCODE) {
+          ++object_it;
+        }
+        redex_assert(opcode::is_move_result_any(object_it->insn->opcode()));
+      }
+      return std::make_pair(object_it, object_it->insn->dest());
+    }
+    return find_move_point_new_instance(object_insn);
+  }
+  // Performs the rewrite; returns true only if the array was hoisted.
+  bool run() {
+    // Find a sput-object for `$VALUES`.
+    array_sput = find_values_sput();
+    redex_assert(array_sput->opcode() == OPCODE_SPUT_OBJECT);
+
+    // Find the definition of the field object.
+    array_new_array = insn_map.at(find_singleton_def(array_sput, 0));
+
+    if (array_new_array->insn->opcode() != OPCODE_NEW_ARRAY) {
+      // Possibly Kotlin enum with `.$values()` not inlined, yet.
+      return false;
+    }
+    // Hoist the array lazily, once, only when some aput is going to be moved.
+    bool moved_new_array{false};
+    auto move_array = [&]() {
+      if (moved_new_array) {
+        return;
+      }
+      alloc_reg = move_new_array_to_front();
+      moved_new_array = true;
+    };
+
+    // (The hoist itself happens on demand through move_array() below.)
+
+    // Find all the users of the array. This should be aput-object things.
+    {
+      auto new_array_uses_it = def_use.find(array_new_array->insn);
+      redex_assert(new_array_uses_it != def_use.end());
+      std::optional<reg_t> extra_reg{}; // Shared temp for the copied indices.
+      for (auto& use : new_array_uses_it->second) {
+        // Skip the sput.
+        if (use.insn == array_sput) {
+          continue;
+        }
+        assert_log(use.insn->opcode() == OPCODE_APUT_OBJECT,
+                   "Unexpected opcode %x",
+                   use.insn->opcode());
+        // NOTE(review): use.src_index is not checked to be the array operand.
+        // Look at what defines the stored value (source 0 of the aput).
+        IRInstruction* object_insn = find_singleton_def(use.insn, 0);
+        if (object_insn->opcode() == OPCODE_SGET_OBJECT) {
+          // Field read style, does not really benefit from moving.
+          continue;
+        }
+
+        // OK, may be beneficial.
+        move_array();
+
+        if (!extra_reg) {
+          extra_reg = cfg.allocate_temp();
+        }
+
+        // See if we can hoist it. Check the input parameters.
+        // 1. First parameter is object. Already checked above.
+
+        // 2. Third parameter is index, should be const.
+        IRInstruction* index_insn = find_singleton_def(use.insn, 2);
+        redex_assert(index_insn->opcode() == OPCODE_CONST);
+
+        // We need to find the point where the object is fully
+        // constructed. If the object_insn is a NEW_INSTANCE, search for the
+        // following <init> call. Otherwise just use the result.
+        auto [insert_after_it, obj_reg] = find_move_point(object_insn);
+        // Re-emit the index const and the aput right after that point.
+        b->insert_after(
+            b->to_cfg_instruction_iterator(insert_after_it),
+            {
+                (new IRInstruction(*index_insn))->set_dest(*extra_reg),
+                (new IRInstruction(*use.insn))
+                    ->set_src(0, obj_reg)
+                    ->set_src(1, alloc_reg)
+                    ->set_src(2, *extra_reg),
+            });
+
+        // Remove the old aput.
+        b->remove_insn(cfg.find_insn(use.insn, b).unwrap());
+      }
+    }
+
+    if (!moved_new_array) {
+      return false; // No aput qualified, so the block was left untouched.
+    }
+
+    // Finally remove the old new-array. Do it late so there's no undefined
+    // behavior with deleted things.
+    b->remove_insn(array_new_array);
+
+    return true;
+  }
+};
+
+} // namespace
+// Runs the Rearranger on `code` when its CFG consists of exactly one block.
+MethodResult RearrangeEnumClinitPass::run(DexMethod* m, IRCode* code) {
+  auto cfg = cfg::ScopedCFG(code);
+  if (cfg->num_blocks() != 1) {
+    return MethodResult::kNotOneBlock; // The Rearranger is not attempted.
+  }
+
+  auto res = Rearranger(m, *cfg).run();
+  // A false result from Rearranger::run() is reported as kFailed.
+  return res ? MethodResult::kChanged : MethodResult::kFailed;
+}
+// Applies run() to the <clinit> of each non-external enum and reports counts.
+void RearrangeEnumClinitPass::run_pass(DexStoresVector& stores,
+                                       ConfigFiles&,
+                                       PassManager& mgr) {
+  std::atomic<size_t> cnt_all{0};
+  std::atomic<size_t> cnt_not_one_block{0};
+  std::atomic<size_t> cnt_no_clinit{0};
+  std::atomic<size_t> cnt_below_threshold{0};
+  std::atomic<size_t> cnt_failed{0};
+  std::atomic<size_t> cnt_changed{0};
+  // Tallies are atomics; walk::parallel presumably runs the callback on threads.
+  walk::parallel::classes(build_class_scope(stores), [&](DexClass* c) {
+    if (c->is_external() || !is_enum(c)) {
+      return;
+    }
+
+    cnt_all.fetch_add(1, std::memory_order_relaxed);
+
+    auto* m = c->get_clinit();
+    if (m == nullptr) {
+      // This case can happen for anonymous classes used when an enum case is
+      // specialized.
+      cnt_no_clinit.fetch_add(1, std::memory_order_relaxed);
+      return;
+    }
+    // Skip methods with fewer opcodes than the configured threshold.
+    if (m->get_code()->count_opcodes() < m_threshold) {
+      cnt_below_threshold.fetch_add(1, std::memory_order_relaxed);
+      return;
+    }
+
+    auto res = run(m, m->get_code());
+
+    switch (res) {
+    case MethodResult::kUnknown:
+      not_reached(); // run() has no path that returns kUnknown.
+
+    case MethodResult::kNotOneBlock:
+      cnt_not_one_block.fetch_add(1, std::memory_order_relaxed);
+      break;
+
+    case MethodResult::kFailed:
+      cnt_failed.fetch_add(1, std::memory_order_relaxed);
+      break;
+
+    case MethodResult::kChanged:
+      cnt_changed.fetch_add(1, std::memory_order_relaxed);
+      break;
+    }
+  });
+  // Publish the tallies as pass metrics.
+  mgr.set_metric("changed", cnt_changed.load());
+  mgr.set_metric("failed", cnt_failed.load());
+  mgr.set_metric("no_clinit", cnt_no_clinit.load());
+  mgr.set_metric("below_threshold", cnt_below_threshold.load());
+  mgr.set_metric("not_one_block", cnt_not_one_block.load());
+  mgr.set_metric("all_enum", cnt_all.load());
+}
+// Static instance; presumably the Pass constructor registers it -- confirm.
+static RearrangeEnumClinitPass s_pass;
+
+} // namespace rearrange_enum_clinit
diff --git a/opt/rearrange-enum-clinit/RearrangeEnumClinit.h b/opt/rearrange-enum-clinit/RearrangeEnumClinit.h
@@ -0,0 +1,46 @@
+/*
+ * Copyright (c) Meta Platforms, Inc. and affiliates.
+ *
+ * This source code is licensed under the MIT license found in the
+ * LICENSE file in the root directory of this source tree.
+ */
+
+#pragma once
+
+#include "Pass.h"
+
+class DexMethod;
+class IRCode;
+
+namespace rearrange_enum_clinit {
+// Outcome of RearrangeEnumClinitPass::run for a single method.
+enum class MethodResult {
+  kUnknown, // Never returned by run(); run_pass treats it as unreachable.
+  kNotOneBlock, // The method's CFG did not have exactly one block.
+  kFailed, // The rearrangement reported that it did not apply.
+  kChanged, // The rearrangement was applied to the method.
+};
+// Pass that rearranges the <clinit> of enum classes (see run_pass).
+class RearrangeEnumClinitPass : public Pass {
+ public:
+  RearrangeEnumClinitPass() : Pass("RearrangeEnumClinitPass") {}
+  // Reports redex_properties::simple::preserves_all() as its interactions.
+  redex_properties::PropertyInteractions get_property_interactions()
+      const override {
+    return redex_properties::simple::preserves_all();
+  }
+  // Binds "threshold" to m_threshold -- args presumably (key, default, target).
+  void bind_config() override { bind("threshold", m_threshold, m_threshold); }
+
+  void run_pass(DexStoresVector&, ConfigFiles&, PassManager&) override;
+
+ private:
+  // "Exposed" for testing purposes.
+  static MethodResult run(DexMethod* m, IRCode* code);
+  // <clinit> methods with fewer opcodes than this are skipped by run_pass.
+  size_t m_threshold{10000000};
+
+  friend class RearrangeEnumClinitTest;
+};
+
+} // namespace rearrange_enum_clinit
diff --git a/test/unit/Makefile.am b/test/unit/Makefile.am
@@ -105,6 +105,7 @@ check_PROGRAMS = \
     pure_analysis_test \
     random_forest_test \
     reaching_definitions_test \
+    rearrange_enum_clinit_test \
     reduce_array_literals_test \
     reduce_boolean_branches_test \
     reduce_gotos_test \
@@ -356,6 +357,8 @@ random_forest_test_SOURCES = RandomForestTest.cpp
 
 reaching_definitions_test_SOURCES = ReachingDefinitionsTest.cpp
 
+rearrange_enum_clinit_test_SOURCES = RearrangeEnumClinitTest.cpp
+
 reduce_array_literals_test_SOURCES = ReduceArrayLiteralsTest.cpp
 reduce_array_literals_test_LDADD = $(COMMON_MOCK_TEST_LIBS)