diff --git a/llvm/lib/Target/AIE/AIE1LegalizerInfo.cpp b/llvm/lib/Target/AIE/AIE1LegalizerInfo.cpp new file mode 100644 index 000000000000..7971bff911e3 --- /dev/null +++ b/llvm/lib/Target/AIE/AIE1LegalizerInfo.cpp @@ -0,0 +1,299 @@ +//===- AIE1LegalizerInfo.cpp ----------------------------------------------===// +// +// This file is licensed under the Apache License v2.0 with LLVM Exceptions. +// See https://llvm.org/LICENSE.txt for license information. +// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception +// +// (c) Copyright 2023-2024 Advanced Micro Devices, Inc. or its affiliates +// +//===----------------------------------------------------------------------===// +/// \file +/// This file implements the targeting of the Machinelegalizer class for AIE. +/// \todo This should be generated by TableGen. +//===----------------------------------------------------------------------===// + +#include "AIE1LegalizerInfo.h" +#include "AIEBaseISelLowering.h" +#include "AIEBaseSubtarget.h" +#include "AIELegalizerHelper.h" +#include "llvm/Analysis/VectorUtils.h" +#include "llvm/CodeGen/GlobalISel/LegalizerInfo.h" +#include "llvm/CodeGen/MachineOperand.h" +#include "llvm/CodeGen/TargetOpcodes.h" +#include "llvm/CodeGenTypes/LowLevelType.h" +#include + +using namespace llvm; + +AIE1LegalizerInfo::AIE1LegalizerInfo(const AIEBaseSubtarget &ST) + : AIEHelper(ST) { + using namespace TargetOpcode; + const LLT S8 = LLT::scalar(8); + const LLT S16 = LLT::scalar(16); + const LLT S20 = LLT::scalar(20); + const LLT S32 = LLT::scalar(32); + const LLT S64 = LLT::scalar(64); + const LLT P0 = LLT::pointer(0, 20); + + // 128-bit vectors + const LLT V16S8 = LLT::fixed_vector(16, 8); + const LLT V8S16 = LLT::fixed_vector(8, 16); + const LLT V4S32 = LLT::fixed_vector(4, 32); + + // 256-bit vectors + const LLT V8S32 = LLT::fixed_vector(8, 32); + const LLT V16S16 = LLT::fixed_vector(16, 16); + const LLT V32S8 = LLT::fixed_vector(32, 8); + + // 256-bit accumulators + const LLT ACC256 = LLT::fixed_vector(4, 64); + + // 512-bit vectors + const LLT V16S32 = LLT::fixed_vector(16, 32); + const LLT V32S16 = LLT::fixed_vector(32, 16); + const LLT V64S8 = LLT::fixed_vector(64, 8); + + // 512-bit accumulators + const LLT ACC512 = LLT::fixed_vector(8, 64); + + // 1024-bit vectors + const LLT V32S32 = LLT::fixed_vector(32, 32); + const LLT V64S16 = LLT::fixed_vector(64, 16); + const LLT V128S8 = LLT::fixed_vector(128, 8); + + // 1024-bit accumulators + const LLT ACC1024 = LLT::fixed_vector(16, 64); + + const LLT S128 = LLT::scalar(128); + + auto &IMPLICIT = getActionDefinitionsBuilder({G_IMPLICIT_DEF, G_FREEZE}) + .legalFor({S20, S32, P0, S128}); + + IMPLICIT.widenScalarToNextPow2(0).clampScalar(0, S32, S32); + + getActionDefinitionsBuilder(G_CONSTANT) + .legalFor({S20, S32, P0}) + .widenScalarToNextPow2(0) + .clampScalar(0, S32, S32); + + // FIXME: AIE1 actually supports float + getActionDefinitionsBuilder(G_FCONSTANT).customFor({S16, S32, S64}); + + getActionDefinitionsBuilder(G_ICMP) + .legalFor({{S32, S32}, {S32, P0}}) + .clampScalar(0, S32, S32) + .clampScalar(1, S32, S32); + + getActionDefinitionsBuilder({G_FMUL, G_FDIV, G_FADD, G_FSUB, G_FREM}) + .libcallFor({S32, S64}); + + // Since the only integers smaller than 32 bits we produce are S20 (from + // G_PTRTOINT), the only legal extension is S20 -> S32. + // Extensions to types larger than 64 bits have to be broken down into + // multiple parts. 
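+  // Sketch (illustrative, not from the original patch): the shape this rule
+  // keeps legal is
+  //   %1:_(s20) = G_PTRTOINT %0:_(p0)
+  //   %2:_(s32) = G_ZEXT %1:_(s20)
+  // i.e. exactly the s20 -> s32 extension described above.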
+ getActionDefinitionsBuilder({G_ANYEXT, G_SEXT, G_ZEXT}) + .legalFor({{S32, S20}}) + .clampScalar(0, S32, S32); + // FIXME: (s|z|any)ext s20 to s64 is broken. + + getActionDefinitionsBuilder({G_AND, G_OR}) + .legalFor({S32}) + .widenScalarToNextPow2(0) + .clampScalar(0, S32, S32); + + getActionDefinitionsBuilder(G_XOR) + .legalFor({S32}) + .widenScalarToNextPow2(0) + .clampScalar(0, S32, S32); + + getActionDefinitionsBuilder(G_SEXT_INREG).custom(); + + getActionDefinitionsBuilder({G_ASHR, G_LSHR, G_SHL}) + .legalFor({{S32, S32}}) + .widenScalarToNextPow2(0) + .clampScalar(0, S32, S32) + .clampScalar(1, S32, S32); + + getActionDefinitionsBuilder(G_TRUNC).alwaysLegal(); + + getActionDefinitionsBuilder(G_SELECT) + .legalFor({{S32, S32}, {P0, S32}}) + .widenScalarToNextPow2(0) + .clampScalar(0, S32, S32) + .clampScalar(1, S32, S32); + + getActionDefinitionsBuilder({G_ADD, G_SUB}) + .legalFor({S32}) + .widenScalarToNextPow2(0) + .clampScalar(0, S32, S32); + + // FIXME: G_SADDE/G_SSUBE doesn't support lowering. To support this properly, + // the action needs to be implemented + getActionDefinitionsBuilder({G_UADDO, G_USUBO, G_UADDE, G_USUBE, G_SADDO, + G_SSUBO, G_SADDE, G_SSUBE, G_UADDSAT, G_USUBSAT, + G_SADDSAT, G_SSUBSAT}) + .lower(); + + getActionDefinitionsBuilder(G_MUL) + .legalFor({S32}) + .widenScalarToNextPow2(0) + .minScalar(0, S32) + .libcallFor({S64}); + + // FIXME: G_SMULO, G_UMULO support + getActionDefinitionsBuilder({G_UMULH, G_SMULH}).lower(); + + getActionDefinitionsBuilder({G_SDIV, G_UDIV, G_SREM, G_UREM}) + .libcallFor({S32, S64}) + .widenScalarToNextPow2(0) + .clampScalar(0, S32, S64); + + getActionDefinitionsBuilder({G_SDIVREM, G_UDIVREM}) + .lowerFor({S32, S64}) + .widenScalarToNextPow2(0) + .clampScalar(0, S32, S64); + + getActionDefinitionsBuilder(G_ABS) + .legalFor({S32}) + .lowerFor({S64}) + .widenScalarToNextPow2(0) + .clampScalar(0, S32, S32); + + // The CLZ instruction implements CTLZ, which also covers CTLZ_ZERO_UNDEF + getActionDefinitionsBuilder(G_CTLZ_ZERO_UNDEF) + .lowerFor({{S32, S32}}) + .clampScalar(0, S32, S32) + .clampScalar(1, S32, S32); + + getActionDefinitionsBuilder(G_CTLZ) + .legalFor({{S32, S32}}) + .clampScalar(0, S32, S32) + .clampScalar(1, S32, S32); + + getActionDefinitionsBuilder({G_FSHL, G_FSHR}).lower(); + + getActionDefinitionsBuilder({G_MEMCPY, G_MEMSET, G_MEMMOVE}) + .customIf([=](const LegalityQuery &Query) { + const LLT SizeArg = Query.Types[2]; + return SizeArg == S20; + }) + .libcall(); + + getActionDefinitionsBuilder(G_DYN_STACKALLOC).custom(); + getActionDefinitionsBuilder({G_STACKSAVE, G_STACKRESTORE}).lower(); + + getActionDefinitionsBuilder({G_SMIN, G_SMAX, G_UMIN, G_UMAX}) + .widenScalarToNextPow2(0, 32) + .lower(); + + getActionDefinitionsBuilder({G_FRAME_INDEX, G_GLOBAL_VALUE}).legalFor({P0}); + + getActionDefinitionsBuilder(G_INTTOPTR) + .legalFor({{P0, S20}}) + .widenScalarToNextPow2(1) + .clampScalar(1, S20, S20); + + getActionDefinitionsBuilder(G_PTRTOINT) + .legalFor({{S20, P0}}) + .widenScalarToNextPow2(0) + .clampScalar(0, S20, S20); + + // We support pointer arithmetic on both GPRs (32-bits) and pointer regs + // (20-bits, where the scalar addend resides in a MOD register). 
To allow + // specifying alternative register bank mappings, we need to truncate the RHS + // operand to 20-bits, thus we only allow s20 types for the scalar addend + getActionDefinitionsBuilder(G_PTR_ADD) + .legalFor({{P0, S20}}) + .widenScalarToNextPow2(1) + .clampScalar(1, S20, S20); + + getActionDefinitionsBuilder({G_LOAD, G_STORE}) + .legalForTypesWithMemDesc({ + {S32, P0, S8, 8}, {S32, P0, S16, 16}, + {S20, P0, S20, 32}, {S32, P0, S32, 32}, + {P0, P0, S20, 32}, {V16S8, P0, V16S8, 16}, + {V8S16, P0, V8S16, 16}, {V4S32, P0, V4S32, 16}, + {V8S32, P0, V8S32, 32}, {V16S16, P0, V16S16, 32}, + {V32S8, P0, V32S8, 32}, {V16S32, P0, V16S32, 32}, + {V32S16, P0, V32S16, 32}, {V64S8, P0, V64S8, 32}, + {V32S32, P0, V32S32, 32}, {V64S16, P0, V64S16, 32}, + {V128S8, P0, V128S8, 32}, {ACC256, P0, ACC256, 32}, + {ACC512, P0, ACC512, 32}, {ACC1024, P0, ACC1024, 32}, + {S128, P0, S128, 16}, + }) + .widenScalarToNextPow2(0) + .lowerIfMemSizeNotPow2() + .bitcastIf( + [=](const LegalityQuery &Query) { + const LLT &Ty = Query.Types[0]; + return Ty.isVector() && + (Ty.getSizeInBits() == 64 || Ty.getSizeInBits() == 32); + }, + [=](const LegalityQuery &Query) { + const LLT Ty = Query.Types[0]; + const unsigned Size = Ty.getSizeInBits(); + assert(Size % 32 == 0); + return std::pair(0, LLT::scalar(Size)); + }) + .clampScalar(0, S32, S32) + .lower(); + + // FIXME: Storing a pointer to an un-aligned address isn't supported. + getActionDefinitionsBuilder({G_ZEXTLOAD, G_SEXTLOAD}) + .legalForTypesWithMemDesc({{S32, P0, S8, 8}, {S32, P0, S16, 16}}) + .widenScalarToNextPow2(0) + .lowerIfMemSizeNotPow2() + .clampScalar(0, S32, S32) + .lower(); + + // Control-flow + getActionDefinitionsBuilder(G_BRCOND).legalFor({S32}).clampScalar(0, S32, + S32); + + getActionDefinitionsBuilder(G_PHI) + .legalFor({S20, S32, P0}) + .widenScalarToNextPow2(0) + .clampScalar(0, S32, S32); + + getActionDefinitionsBuilder(G_JUMP_TABLE).custom(); + + getActionDefinitionsBuilder(G_BRJT).custom(); + + getActionDefinitionsBuilder(G_BRINDIRECT).legalFor({P0}); + + // Variadic functions + getActionDefinitionsBuilder(G_VASTART).custom(); + getActionDefinitionsBuilder(G_VAARG).custom(); + + getLegacyLegalizerInfo().computeTables(); + verify(*ST.getInstrInfo()); +} + +bool AIE1LegalizerInfo::legalizeCustom( + LegalizerHelper &Helper, MachineInstr &MI, + LostDebugLocObserver &LocObserver) const { + switch (MI.getOpcode()) { + default: + break; + case TargetOpcode::G_VASTART: + return AIEHelper.legalizeG_VASTART(Helper, MI); + case TargetOpcode::G_VAARG: + return AIEHelper.legalizeG_VAARG(Helper, MI); + case TargetOpcode::G_MEMSET: + case TargetOpcode::G_MEMCPY: + case TargetOpcode::G_MEMMOVE: + return AIEHelper.legalizeMemCalls(Helper, MI, LocObserver); + case TargetOpcode::G_BRJT: + return AIEHelper.legalizeG_BRJT(Helper, MI); + case TargetOpcode::G_FCONSTANT: + return AIEHelper.legalizeG_FCONSTANT(Helper, MI); + case TargetOpcode::G_JUMP_TABLE: + return AIEHelper.legalizeG_JUMP_TABLE(Helper, MI); + case TargetOpcode::G_DYN_STACKALLOC: + return AIEHelper.legalizeG_DYN_STACKALLOC(Helper, MI); + case TargetOpcode::G_SEXT_INREG: + return AIEHelper.legalizeG_SEXT_INREG(Helper, MI); + } + + llvm_unreachable("Un-expected custom legalization"); +} diff --git a/llvm/lib/Target/AIE/AIE1LegalizerInfo.h b/llvm/lib/Target/AIE/AIE1LegalizerInfo.h new file mode 100644 index 000000000000..eb26003576f0 --- /dev/null +++ b/llvm/lib/Target/AIE/AIE1LegalizerInfo.h @@ -0,0 +1,37 @@ +//===- AIELegalizerInfo.h ---------------------------------------*- C++ -*-===// +// +// 
This file is licensed under the Apache License v2.0 with LLVM Exceptions. +// See https://llvm.org/LICENSE.txt for license information. +// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception +// +// (c) Copyright 2023-2024 Advanced Micro Devices, Inc. or its affiliates +// +//===----------------------------------------------------------------------===// +/// \file +/// This file declares the targeting of the Machinelegalizer class for AIE. +/// \todo This should be generated by TableGen. +//===----------------------------------------------------------------------===// + +#ifndef LLVM_LIB_TARGET_AIE_AIE1MACHINELEGALIZER_H +#define LLVM_LIB_TARGET_AIE_AIE1MACHINELEGALIZER_H + +#include "AIELegalizerHelper.h" +#include "llvm/CodeGen/GlobalISel/LegalizerInfo.h" +#include "llvm/CodeGen/Register.h" +#include "llvm/IR/InstrTypes.h" + +namespace llvm { + +class AIEBaseSubtarget; + +/// This class provides legalization strategies. +class AIE1LegalizerInfo : public LegalizerInfo { + AIELegalizerHelper AIEHelper; + +public: + AIE1LegalizerInfo(const AIEBaseSubtarget &ST); + bool legalizeCustom(LegalizerHelper &Helper, MachineInstr &MI, + LostDebugLocObserver &LocObserver) const override; +}; +} // end namespace llvm +#endif diff --git a/llvm/lib/Target/AIE/AIE2InstrInfo.cpp b/llvm/lib/Target/AIE/AIE2InstrInfo.cpp index 9021bf019c30..deb7c1100c0a 100644 --- a/llvm/lib/Target/AIE/AIE2InstrInfo.cpp +++ b/llvm/lib/Target/AIE/AIE2InstrInfo.cpp @@ -744,6 +744,27 @@ unsigned AIE2InstrInfo::getCycleSeparatorOpcode() const { return AIE2::CYCLE_SEPARATOR; } +unsigned AIE2InstrInfo::getGenericAddVectorEltOpcode() const { + return AIE2::G_AIE_ADD_VECTOR_ELT_LEFT; +} + +unsigned AIE2InstrInfo::getGenericInsertVectorEltOpcode() const { + return AIE2::G_AIE_INSERT_VECTOR_ELT; +} + +unsigned AIE2InstrInfo::getGenericExtractVectorEltOpcode(bool SignExt) const { + return SignExt ? 
AIE2::G_AIE_SEXT_EXTRACT_VECTOR_ELT + : AIE2::G_AIE_ZEXT_EXTRACT_VECTOR_ELT; +} + +unsigned AIE2InstrInfo::getGenericPadVectorOpcode() const { + return AIE2::G_AIE_PAD_VECTOR_UNDEF; +} + +unsigned AIE2InstrInfo::getGenericUnpadVectorOpcode() const { + return AIE2::G_AIE_UNPAD_VECTOR; +} + unsigned int getVLDSparseOpcode(unsigned int PseudoOpc) { switch (PseudoOpc) { case AIE2::PSEUDO_VLD_SPARSE_POP_16_set_low: diff --git a/llvm/lib/Target/AIE/AIE2InstrInfo.h b/llvm/lib/Target/AIE/AIE2InstrInfo.h index 287d45f9fbf7..a4242838f958 100644 --- a/llvm/lib/Target/AIE/AIE2InstrInfo.h +++ b/llvm/lib/Target/AIE/AIE2InstrInfo.h @@ -42,6 +42,11 @@ class AIE2InstrInfo : public AIE2GenInstrInfo { unsigned getPseudoMoveOpcode() const override; unsigned getConstantMovOpcode(MachineRegisterInfo &MRI, unsigned int Reg, APInt &Val) const override; + unsigned getGenericAddVectorEltOpcode() const override; + unsigned getGenericInsertVectorEltOpcode() const override; + unsigned getGenericExtractVectorEltOpcode(bool SignExt) const override; + unsigned getGenericPadVectorOpcode() const override; + unsigned getGenericUnpadVectorOpcode() const override; unsigned getCycleSeparatorOpcode() const override; bool isLock(unsigned Opc) const override; bool isDelayedSchedBarrier(const MachineInstr &MI) const override; diff --git a/llvm/lib/Target/AIE/AIE2LegalizerInfo.cpp b/llvm/lib/Target/AIE/AIE2LegalizerInfo.cpp index efedcaab9564..0f3538aba2b5 100644 --- a/llvm/lib/Target/AIE/AIE2LegalizerInfo.cpp +++ b/llvm/lib/Target/AIE/AIE2LegalizerInfo.cpp @@ -15,8 +15,534 @@ #include "AIE2LegalizerInfo.h" #include "AIE2Subtarget.h" +#include "llvm/CodeGen/GlobalISel/GenericMachineInstrs.h" +#include "llvm/CodeGen/GlobalISel/LostDebugLocObserver.h" +#include "llvm/CodeGen/GlobalISel/MachineIRBuilder.h" using namespace llvm; +using namespace LegalityPredicates; -AIE2LegalizerInfo::AIE2LegalizerInfo(const AIE2Subtarget &STI) - : AIELegalizerInfo(STI) {} +static LegalityPredicate isLegalBitCastType(unsigned TypeIdx) { + return [=](const LegalityQuery &Query) { + LLT Ty = Query.Types[TypeIdx]; + if (Ty.isScalar()) + return Ty == LLT::scalar(32) || Ty == LLT::scalar(64); + const int EltSize = Ty.isVector() ? 
Ty.getElementType().getSizeInBits() : 0;
+    return EltSize == 8 || EltSize == 16 || EltSize == 32 || EltSize == 64;
+  };
+}
+
+static LegalizeMutation bitcastAccToVectorType(unsigned TypeIdx) {
+  return [=](const LegalityQuery &Query) {
+    LLT OrigTy = Query.Types[TypeIdx];
+    assert(OrigTy.getElementType() == LLT::scalar(64) &&
+           "Expected an accumulator type");
+    unsigned Size = OrigTy.getSizeInBits();
+    assert(Size % 32 == 0);
+    return std::pair(TypeIdx, LLT::fixed_vector(Size / 32, 32));
+  };
+}
+
+static LegalizeMutation bitcastToVectorElement32(const unsigned TypeIdx) {
+  return [=](const LegalityQuery &Query) {
+    const LLT Ty = Query.Types[TypeIdx];
+    unsigned Size = Ty.getSizeInBits();
+    assert(Size % 32 == 0);
+    return std::pair(
+        TypeIdx, LLT::scalarOrVector(ElementCount::getFixed(Size / 32), 32));
+  };
+}
+
+static LegalityPredicate
+isValidVectorMergeUnmergeOp(const unsigned BigVectorId,
+                            const unsigned SmallVectorId) {
+  return [=](const LegalityQuery &Query) {
+    const LLT Big = Query.Types[BigVectorId];
+    const LLT Small = Query.Types[SmallVectorId];
+    return Big.isVector() && Small.isVector() &&
+           Big.getElementType() == Small.getElementType() &&
+           Small.getNumElements() * 2 == Big.getNumElements();
+  };
+}
+
+static LegalityPredicate isValidVectorAIE2(const unsigned TypeIdx) {
+  return [=](const LegalityQuery &Query) {
+    const LLT DstTy = Query.Types[TypeIdx];
+    const unsigned DstSize = DstTy.getSizeInBits();
+    return DstTy.isVector() && (DstSize == 32 || DstSize > 64);
+  };
+}
+
+LegalityPredicate
+negatePredicate(const std::function<bool(const LegalityQuery &)> &Func) {
+  return [=](const LegalityQuery &Query) { return !Func(Query); };
+}
+
+AIE2LegalizerInfo::AIE2LegalizerInfo(const AIE2Subtarget &ST) : AIEHelper(ST) {
+  using namespace TargetOpcode;
+  const LLT S8 = LLT::scalar(8);
+  const LLT S16 = LLT::scalar(16);
+  const LLT S20 = LLT::scalar(20);
+  const LLT S32 = LLT::scalar(32);
+  const LLT S64 = LLT::scalar(64);
+  const LLT P0 = LLT::pointer(0, 20);
+
+  // 32-bit vectors
+  const LLT V4S8 = LLT::fixed_vector(4, 8);
+  const LLT V2S16 = LLT::fixed_vector(2, 16);
+
+  // 64-bit vectors
+  const LLT V2S32 = LLT::fixed_vector(2, 32);
+
+  // 128-bit vectors
+  const LLT V16S8 = LLT::fixed_vector(16, 8);
+  const LLT V8S16 = LLT::fixed_vector(8, 16);
+  const LLT V4S32 = LLT::fixed_vector(4, 32);
+
+  // 256-bit vectors
+  const LLT V8S32 = LLT::fixed_vector(8, 32);
+  const LLT V16S16 = LLT::fixed_vector(16, 16);
+  const LLT V32S8 = LLT::fixed_vector(32, 8);
+
+  // 256-bit accumulators
+  const LLT ACC256 = LLT::fixed_vector(4, 64);
+
+  // 512-bit vectors
+  const LLT V16S32 = LLT::fixed_vector(16, 32);
+  const LLT V32S16 = LLT::fixed_vector(32, 16);
+  const LLT V64S8 = LLT::fixed_vector(64, 8);
+
+  // 512-bit accumulators
+  const LLT ACC512 = LLT::fixed_vector(8, 64);
+
+  // 1024-bit vectors
+  const LLT V32S32 = LLT::fixed_vector(32, 32);
+  const LLT V64S16 = LLT::fixed_vector(64, 16);
+  const LLT V128S8 = LLT::fixed_vector(128, 8);
+
+  // 1024-bit accumulators
+  const LLT ACC1024 = LLT::fixed_vector(16, 64);
+
+  const LLT S128 = LLT::scalar(128);
+
+  static const std::initializer_list<LLT> AIE2VectorTypes = {
+      /* Begin 32-bit types */
+      V4S8, V2S16,
+      /* Begin 256-bit types */
+      V8S32, V16S16, V32S8,
+      /* Begin 512-bit types */
+      V16S32, V32S16, V64S8,
+      /* Begin 1024-bit types */
+      V32S32, V64S16, V128S8};
+
+  // Accumulator types are 32-bit vectors that pretend to be 64-bit vectors
+  // of half the size.
+  static const std::initializer_list<LLT> AIE2AccumulatorTypes = {
+      /* Begin 256-bit types */
+      ACC256,
+      /* Begin 512-bit types */
+      ACC512,
+      /* Begin 1024-bit types */
+      ACC1024};
+
+  getActionDefinitionsBuilder({G_IMPLICIT_DEF, G_FREEZE})
+      .legalFor({S20, S32, P0, S128})
+      .legalFor(AIE2VectorTypes)
+      .legalFor(AIE2AccumulatorTypes)
+      .widenScalarToNextPow2(0)
+      .clampScalar(0, S32, S32);
+
+  getActionDefinitionsBuilder(G_CONSTANT)
+      .legalFor({S20, S32, P0})
+      .widenScalarToNextPow2(0)
+      .clampScalar(0, S32, S32);
+
+  // FIXME: AIE1 actually supports float. But since AIE2 is using the same
+  // legalizer, we will cast both types to int for now.
+  getActionDefinitionsBuilder(G_FCONSTANT).customFor({S16, S32, S64});
+
+  getActionDefinitionsBuilder(G_ICMP)
+      .legalFor({{S32, S32}, {S32, P0}})
+      .clampScalar(0, S32, S32)
+      .clampScalar(1, S32, S32);
+
+  getActionDefinitionsBuilder(G_FCMP)
+      .clampScalar(0, S32, S32)
+      .customFor({{S32, S16}, {S32, S32}});
+
+  getActionDefinitionsBuilder(G_FPTRUNC)
+      .libcallFor({{S32, S64}})
+      .customFor({{S16, S32}});
+
+  getActionDefinitionsBuilder({G_SITOFP, G_UITOFP})
+      .libcallForCartesianProduct({S32, S64})
+      .clampScalar(1, S32, S64)
+      .widenScalarToNextPow2(1)
+      .clampScalar(0, S32, S64);
+
+  getActionDefinitionsBuilder(G_FPEXT)
+      .libcallFor({{S64, S32}})
+      .customFor({{S32, S16}})
+      .narrowScalarFor({{S64, S16}}, llvm::LegalizeMutations::changeTo(0, S32));
+
+  getActionDefinitionsBuilder({G_FPTOSI, G_FPTOUI})
+      .libcallForCartesianProduct({S32, S64})
+      .clampScalar(0, S32, S64)
+      .widenScalarToNextPow2(0)
+      .clampScalar(1, S32, S64);
+
+  getActionDefinitionsBuilder(G_FABS).customFor({S16, S32, S64});
+
+  getActionDefinitionsBuilder({G_FADD, G_FSUB})
+      .legalFor({V16S32})
+      .customFor({S16})
+      .libcallFor({S32, S64});
+
+  getActionDefinitionsBuilder({G_FMUL, G_FDIV, G_FREM})
+      .clampScalar(0, S32, S64)
+      .libcallFor({S32, S64});
+
+  // Since the only integers smaller than 32 bits we produce are S20 (from
+  // G_PTRTOINT), the only legal extension is S20 -> S32.
+  // Extensions to types larger than 64 bits have to be broken down into
+  // multiple parts.
+  getActionDefinitionsBuilder({G_ANYEXT, G_SEXT, G_ZEXT})
+      .legalFor({{S32, S20}})
+      .clampScalar(0, S32, S32);
+  // FIXME: (s|z|any)ext s20 to s64 is broken.
+
+  getActionDefinitionsBuilder({G_AND, G_OR})
+      .legalFor({S32})
+      .legalFor(AIE2VectorTypes)
+      .widenScalarToNextPow2(0)
+      .clampScalar(0, S32, S32);
+
+  getActionDefinitionsBuilder(G_XOR)
+      .legalFor({S32})
+      .widenScalarToNextPow2(0)
+      .clampScalar(0, S32, S32);
+
+  getActionDefinitionsBuilder(G_SEXT_INREG).custom();
+
+  getActionDefinitionsBuilder({G_ASHR, G_LSHR, G_SHL})
+      .legalFor({{S32, S32}})
+      .widenScalarToNextPow2(0)
+      .clampScalar(0, S32, S32)
+      .clampScalar(1, S32, S32);
+
+  getActionDefinitionsBuilder(G_TRUNC).alwaysLegal();
+
+  getActionDefinitionsBuilder(G_SELECT)
+      .legalFor({{S32, S32}, {P0, S32}})
+      .widenScalarToNextPow2(0)
+      .clampScalar(0, S32, S32)
+      .clampScalar(1, S32, S32)
+      .legalFor(AIE2VectorTypes)
+      // We support G_SELECT only on the vector register bank.
+      // Mapping the G_SELECT operands to the vector register bank
+      // during register bank selection introduces the proper cross-bank
+      // copies. However, we cannot write ISEL patterns expressing accumulator
+      // types on vector register banks, which would require duplicating the
+      // vector type patterns in C++. Introducing bitcasts during legalization
+      // allows us to re-use the existing code for register bank selection and
+      // ISEL patterns.
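+      // Illustrative sketch (not part of the original patch): a G_SELECT on
+      // ACC512 = <8 x s64> is rewritten by bitcastAccToVectorType(0) to the
+      // equally sized plain vector type <16 x s32> (512 / 32 = 16 lanes).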
+ .bitcastIf(typeInSet(0, AIE2AccumulatorTypes), bitcastAccToVectorType(0)); + + getActionDefinitionsBuilder({G_ADD, G_SUB}) + .legalFor({S32}) + .legalFor({V16S32, V32S16, V64S8}) + .widenScalarToNextPow2(0) + .clampScalar(0, S32, S32); + + // FIXME: G_SADDE/G_SSUBE doesn't support lowering. To support this properly, + // the action needs to be implemented + // FIXME: AIE2 has ADC and SBC operations to read the carry. + getActionDefinitionsBuilder({G_UADDO, G_USUBO, G_UADDE, G_USUBE, G_SADDO, + G_SSUBO, G_SADDE, G_SSUBE, G_UADDSAT, G_USUBSAT, + G_SADDSAT, G_SSUBSAT}) + .lower(); + + getActionDefinitionsBuilder(G_MUL) + .legalFor({S32}) + .widenScalarToNextPow2(0) + .minScalar(0, S32) + .libcallFor({S64}); + + // FIXME: G_SMULO, G_UMULO support + getActionDefinitionsBuilder({G_UMULH, G_SMULH}).lower(); + + getActionDefinitionsBuilder({G_SDIV, G_UDIV, G_SREM, G_UREM}) + .libcallFor({S32, S64}) + .widenScalarToNextPow2(0) + .clampScalar(0, S32, S64); + + getActionDefinitionsBuilder({G_SDIVREM, G_UDIVREM}) + .lowerFor({S32, S64}) + .widenScalarToNextPow2(0) + .clampScalar(0, S32, S64); + + getActionDefinitionsBuilder(G_ABS) + .legalFor({S32}) + .lowerFor({S64}) + .widenScalarToNextPow2(0) + .clampScalar(0, S32, S32); + + // The CLZ instruction implements CTLZ, which also covers CTLZ_ZERO_UNDEF + getActionDefinitionsBuilder(G_CTLZ_ZERO_UNDEF) + .lowerFor({{S32, S32}}) + .clampScalar(0, S32, S32) + .clampScalar(1, S32, S32); + + getActionDefinitionsBuilder(G_CTLZ) + .legalFor({{S32, S32}}) + .clampScalar(0, S32, S32) + .clampScalar(1, S32, S32); + + getActionDefinitionsBuilder({G_FSHL, G_FSHR}).lower(); + + getActionDefinitionsBuilder({G_MEMCPY, G_MEMSET, G_MEMMOVE}) + .customIf([=](const LegalityQuery &Query) { + const LLT SizeArg = Query.Types[2]; + return SizeArg == S20; + }) + .libcall(); + + getActionDefinitionsBuilder(G_DYN_STACKALLOC).custom(); + getActionDefinitionsBuilder({G_STACKSAVE, G_STACKRESTORE}).lower(); + + getActionDefinitionsBuilder({G_SMIN, G_SMAX, G_UMIN, G_UMAX}) + .widenScalarToNextPow2(0, 32) + .lower(); + + getActionDefinitionsBuilder({G_FRAME_INDEX, G_GLOBAL_VALUE}).legalFor({P0}); + + getActionDefinitionsBuilder(G_INTTOPTR) + .legalFor({{P0, S20}}) + .widenScalarToNextPow2(1) + .clampScalar(1, S20, S20); + + getActionDefinitionsBuilder(G_PTRTOINT) + .legalFor({{S20, P0}}) + .widenScalarToNextPow2(0) + .clampScalar(0, S20, S20); + + // We support pointer arithmetic on both GPRs (32-bits) and pointer regs + // (20-bits, where the scalar addend resides in a MOD register). 
To allow + // specifying alternative register bank mappings, we need to truncate the RHS + // operand to 20-bits, thus we only allow s20 types for the scalar addend + getActionDefinitionsBuilder(G_PTR_ADD) + .legalFor({{P0, S20}}) + .widenScalarToNextPow2(1) + .clampScalar(1, S20, S20); + + getActionDefinitionsBuilder({G_LOAD, G_STORE}) + .legalForTypesWithMemDesc({ + {S32, P0, S8, 8}, {S32, P0, S16, 16}, + {S20, P0, S20, 32}, {S32, P0, S32, 32}, + {P0, P0, S20, 32}, {V16S8, P0, V16S8, 16}, + {V8S16, P0, V8S16, 16}, {V4S32, P0, V4S32, 16}, + {V8S32, P0, V8S32, 32}, {V16S16, P0, V16S16, 32}, + {V32S8, P0, V32S8, 32}, {V16S32, P0, V16S32, 32}, + {V32S16, P0, V32S16, 32}, {V64S8, P0, V64S8, 32}, + {V32S32, P0, V32S32, 32}, {V64S16, P0, V64S16, 32}, + {V128S8, P0, V128S8, 32}, {ACC256, P0, ACC256, 32}, + {ACC512, P0, ACC512, 32}, {ACC1024, P0, ACC1024, 32}, + {S128, P0, S128, 16}, + }) + .widenScalarToNextPow2(0) + .lowerIfMemSizeNotPow2() + .bitcastIf( + [=](const LegalityQuery &Query) { + const LLT &Ty = Query.Types[0]; + return Ty.isVector() && + (Ty.getSizeInBits() == 64 || Ty.getSizeInBits() == 32); + }, + [=](const LegalityQuery &Query) { + const LLT Ty = Query.Types[0]; + const unsigned Size = Ty.getSizeInBits(); + assert(Size % 32 == 0); + return std::pair(0, LLT::scalar(Size)); + }) + .clampScalar(0, S32, S32) + .lower(); + + // FIXME: Storing a pointer to an un-aligned address isn't supported. + getActionDefinitionsBuilder({G_ZEXTLOAD, G_SEXTLOAD}) + .legalForTypesWithMemDesc({{S32, P0, S8, 8}, {S32, P0, S16, 16}}) + .widenScalarToNextPow2(0) + .lowerIfMemSizeNotPow2() + .clampScalar(0, S32, S32) + .lower(); + + getActionDefinitionsBuilder(G_EXTRACT_VECTOR_ELT) + .unsupportedIf([=](const LegalityQuery &Query) { + const LLT &EltTy = Query.Types[1].getElementType(); + return Query.Types[0] != EltTy; + }) + // If it is 32-bit, the LLVM can perform some bitshifts to legalize it + .bitcastIf( + [=](const LegalityQuery &Query) { + const LLT &VecTy = Query.Types[1]; + return VecTy.getSizeInBits() == 32; + }, + bitcastToVectorElement32(1)) + // Extraction is supported for the native types of 32-, 256-, 512- and + // 1024-bit + .customIf(typeInSet(1, {V4S8, V2S16, V2S32, V8S32, V16S32, V32S32, V16S16, + V32S8, V32S16, V64S8, V64S16, V128S8})) + // For 16-bits, we want to increase the number of elements to 4. Since + // our architecture doesn't always support all intermediate sizes, we do + // it as a special case so that we can use them minimum clamp for the + // smallest vector register. + .moreElementsIf( + [=](const LegalityQuery &Query) { + return Query.Types[1].getScalarSizeInBits() == 8 && + Query.Types[1].getNumElements() == 2; + }, + [=](const LegalityQuery &Query) { + return std::make_pair(1, LLT::fixed_vector(4, S8)); + }) + // Increase the input vectors if they don't fit in the smallest vector + // register + .clampMinNumElements(1, S8, 32) + .clampMinNumElements(1, S16, 16) + .clampMinNumElements(1, S32, 8); + + getActionDefinitionsBuilder(G_INSERT_VECTOR_ELT) + .clampScalar(2, S32, S32) // Clamp the idx to 32 bit since VINSERT + // relies on eR29 only for idx. 
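+      // Illustrative sketch (not part of the original patch): inserting an
+      // s8 element into V32S8 with, say, an s64 index first has the index
+      // clamped to s32; only then does the custom action below hand the
+      // insert to AIELegalizerHelper::legalizeG_INSERT_VECTOR_ELT.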
.customIf(typeInSet(0, {V2S32, V8S32, V16S16, V32S8, V16S32, V32S16,
+                              V64S8, V32S32, V64S16, V128S8}));
+
+  // Control-flow
+  getActionDefinitionsBuilder(G_BRCOND).legalFor({S32}).clampScalar(0, S32,
+                                                                    S32);
+
+  getActionDefinitionsBuilder(G_PHI)
+      .legalFor({S20, S32, P0})
+      .legalFor(AIE2VectorTypes)
+      .legalFor(AIE2AccumulatorTypes)
+      .widenScalarToNextPow2(0)
+      .clampScalar(0, S32, S32);
+
+  const LegalityPredicate IsNotValidDestinationVector =
+      negatePredicate(isValidVectorAIE2(0));
+
+  getActionDefinitionsBuilder(G_BITCAST).legalIf(
+      LegalityPredicates::all(isLegalBitCastType(0), isLegalBitCastType(1)));
+
+  getActionDefinitionsBuilder(G_MERGE_VALUES).legalFor({{S64, S32}});
+  getActionDefinitionsBuilder(G_UNMERGE_VALUES)
+      .legalFor({{S32, S64}, {S32, V2S32}})
+      .customIf([=](const LegalityQuery &Query) {
+        const LLT &DstTy = Query.Types[0];
+        const LLT &SrcTy = Query.Types[1];
+
+        return SrcTy.isVector() && DstTy.isScalar() &&
+               DstTy == SrcTy.getElementType();
+      })
+      .unsupportedIf(IsNotValidDestinationVector)
+      .legalIf(isValidVectorMergeUnmergeOp(1, 0));
+
+  getActionDefinitionsBuilder(G_CONCAT_VECTORS)
+      .unsupportedIf(IsNotValidDestinationVector)
+      .legalIf(isValidVectorMergeUnmergeOp(0, 1));
+
+  getActionDefinitionsBuilder(G_BUILD_VECTOR)
+      // Legacy legalization for bitcasts
+      .legalFor({{V2S32, S32}})
+      .unsupportedIf(IsNotValidDestinationVector)
+      // We clamp the high values and not the low ones, since the former
+      // splits the values but the latter keeps the same G_BUILD_VECTOR in
+      // the output instructions, which causes an infinite loop since it
+      // can't reach our custom legalization code.
+      .clampMaxNumElements(0, S8, 64)
+      .clampMaxNumElements(0, S16, 32)
+      .clampMaxNumElements(0, S32, 16)
+      .custom();
+
+  getActionDefinitionsBuilder(G_SHUFFLE_VECTOR)
+      .unsupportedIf(IsNotValidDestinationVector)
+      // Checks if the shuffle is "canonical"; this enables additional actions
+      // in the LLVM combiner and can change shuffle vector legalization
+      .lowerIf([=](const LegalityQuery &Query) {
+        return Query.Types[0] == Query.Types[1];
+      })
+      .lower();
+
+  getActionDefinitionsBuilder(G_JUMP_TABLE).custom();
+
+  getActionDefinitionsBuilder(G_BRJT).custom();
+
+  getActionDefinitionsBuilder(G_BRINDIRECT).legalFor({P0});
+
+  // Variadic functions
+  getActionDefinitionsBuilder(G_VASTART).custom();
+  getActionDefinitionsBuilder(G_VAARG).custom();
+
+  getLegacyLegalizerInfo().computeTables();
+  verify(*ST.getInstrInfo());
+}
+
+bool AIE2LegalizerInfo::legalizeCustom(
+    LegalizerHelper &Helper, MachineInstr &MI,
+    LostDebugLocObserver &LocObserver) const {
+  switch (MI.getOpcode()) {
+  default:
+    break;
+  case TargetOpcode::G_VASTART:
+    return AIEHelper.legalizeG_VASTART(Helper, MI);
+  case TargetOpcode::G_VAARG:
+    return AIEHelper.legalizeG_VAARG(Helper, MI);
+  case TargetOpcode::G_MEMSET:
+  case TargetOpcode::G_MEMCPY:
+  case TargetOpcode::G_MEMMOVE:
+    return AIEHelper.legalizeMemCalls(Helper, MI, LocObserver);
+  case TargetOpcode::G_BRJT:
+    return AIEHelper.legalizeG_BRJT(Helper, MI);
+  case TargetOpcode::G_FCONSTANT:
+    return AIEHelper.legalizeG_FCONSTANT(Helper, MI);
+  case TargetOpcode::G_JUMP_TABLE:
+    return AIEHelper.legalizeG_JUMP_TABLE(Helper, MI);
+  case TargetOpcode::G_DYN_STACKALLOC:
+    return AIEHelper.legalizeG_DYN_STACKALLOC(Helper, MI);
+  case TargetOpcode::G_EXTRACT_VECTOR_ELT:
+    return AIEHelper.legalizeG_EXTRACT_VECTOR_ELT(Helper, MI);
+  case TargetOpcode::G_INSERT_VECTOR_ELT:
+    return AIEHelper.legalizeG_INSERT_VECTOR_ELT(Helper, MI);
+  case
TargetOpcode::G_FCMP:
+    return AIEHelper.legalizeG_FCMP(Helper, MI, LocObserver);
+  case TargetOpcode::G_FPTRUNC:
+    return AIEHelper.legalizeG_FPTRUNC(Helper, MI);
+  case TargetOpcode::G_FPEXT:
+    return AIEHelper.legalizeG_FPEXT(Helper, MI);
+  case TargetOpcode::G_FABS:
+    return AIEHelper.legalizeG_FABS(Helper, MI);
+  case TargetOpcode::G_FADD:
+  case TargetOpcode::G_FSUB:
+    return AIEHelper.legalizeG_FADDSUB(Helper, MI);
+  case TargetOpcode::G_BUILD_VECTOR:
+    return AIEHelper.legalizeG_BUILD_VECTOR(Helper, MI);
+  case TargetOpcode::G_UNMERGE_VALUES:
+    return AIEHelper.legalizeG_UNMERGE_VALUES(Helper, MI);
+  case TargetOpcode::G_SEXT_INREG:
+    return AIEHelper.legalizeG_SEXT_INREG(Helper, MI);
+  }
+
+  llvm_unreachable("Un-expected custom legalization");
+}
+
+bool AIE2LegalizerInfo::legalizeIntrinsic(LegalizerHelper &Helper,
+                                          MachineInstr &MI) const {
+
+  // The loop_decrement is a bit of an exception in legalization since it
+  // is an architecture-neutral intrinsic to implement hardware loops, not a
+  // dedicated AIE intrinsic. As such it carries a boolean, which should be
+  // legalized to a 32-bit integer type.
+  switch (cast<GIntrinsic>(MI).getIntrinsicID()) {
+  case Intrinsic::loop_decrement:
+    return AIEHelper.legalizeLoopDecrement(Helper, MI);
+  }
+
+  return true;
+}
diff --git a/llvm/lib/Target/AIE/AIE2LegalizerInfo.h b/llvm/lib/Target/AIE/AIE2LegalizerInfo.h
index f5d15f7b045d..25688470e0f2 100644
--- a/llvm/lib/Target/AIE/AIE2LegalizerInfo.h
+++ b/llvm/lib/Target/AIE/AIE2LegalizerInfo.h
@@ -1,4 +1,4 @@
-//===- AIE2LegalizerInfo ----------------------------------------*- C++ -*-===//
+//===- AIE2LegalizerInfo.h --------------------------------------*- C++ -*-===//
 //
 // This file is licensed under the Apache License v2.0 with LLVM Exceptions.
 // See https://llvm.org/LICENSE.txt for license information.
@@ -16,16 +16,23 @@
 #ifndef LLVM_LIB_TARGET_AIE2_AIE2MACHINELEGALIZER_H
 #define LLVM_LIB_TARGET_AIE2_AIE2MACHINELEGALIZER_H

-#include "AIELegalizerInfo.h"
+#include "AIELegalizerHelper.h"
+#include "llvm/CodeGen/GlobalISel/LegalizerInfo.h"

 namespace llvm {

 class AIE2Subtarget;

 /// This class provides legalization strategies.
-class AIE2LegalizerInfo : public AIELegalizerInfo {
+class AIE2LegalizerInfo : public LegalizerInfo {
+  AIELegalizerHelper AIEHelper;
+
 public:
   AIE2LegalizerInfo(const AIE2Subtarget &ST);
+  bool legalizeCustom(LegalizerHelper &Helper, MachineInstr &MI,
+                      LostDebugLocObserver &LocObserver) const override;
+  bool legalizeIntrinsic(LegalizerHelper &Helper,
+                         MachineInstr &MI) const override;
 };
 } // end namespace llvm
 #endif
diff --git a/llvm/lib/Target/AIE/AIEBaseInstrInfo.h b/llvm/lib/Target/AIE/AIEBaseInstrInfo.h
index 4825a33482b3..c09e5d3cd5e5 100644
--- a/llvm/lib/Target/AIE/AIEBaseInstrInfo.h
+++ b/llvm/lib/Target/AIE/AIEBaseInstrInfo.h
@@ -84,6 +84,32 @@ struct AIEBaseInstrInfo : public TargetInstrInfo {
   virtual unsigned getCycleSeparatorOpcode() const {
     llvm_unreachable("Target didn't implement getCycleSeparatorOpcode");
   }
+  /// Return the opcode to be used for pushing a vector element at the LSB
+  /// position in a vector
+  virtual unsigned getGenericAddVectorEltOpcode() const {
+    llvm_unreachable("Target didn't implement getGenericAddVectorEltOpcode");
+  }
+  /// Return the opcode to be used for inserting a vector element at an
+  /// arbitrary position in a vector
+  virtual unsigned getGenericInsertVectorEltOpcode() const {
+    llvm_unreachable("Target didn't implement getGenericInsertVectorEltOpcode");
+  }
+  /// Return the opcode to be used for extracting a vector element
+  /// \param SignExt True if the extracted element shall be sign extended
+  virtual unsigned getGenericExtractVectorEltOpcode(bool SignExt) const {
+    llvm_unreachable(
+        "Target didn't implement getGenericExtractVectorEltOpcode");
+  }
+  /// Return the opcode to be used for padding undefined values in the high bits
+  /// of a vector
+  virtual unsigned getGenericPadVectorOpcode() const {
+    llvm_unreachable("Target didn't implement getGenericPadVectorOpcode");
+  }
+  /// Return the opcode to be used for extracting a smaller vector by ignoring
+  /// the high bits
+  virtual unsigned getGenericUnpadVectorOpcode() const {
+    llvm_unreachable("Target didn't implement getGenericUnpadVectorOpcode");
+  }
   /// Check whether Opc represents a lock instruction
   virtual bool isLock(unsigned Opc) const { return false; }
   /// Check whether this is a delayed scheduling barrier induced from
diff --git a/llvm/lib/Target/AIE/AIELegalizerInfo.cpp b/llvm/lib/Target/AIE/AIELegalizerHelper.cpp
similarity index 56%
rename from llvm/lib/Target/AIE/AIELegalizerInfo.cpp
rename to llvm/lib/Target/AIE/AIELegalizerHelper.cpp
index 8c456c3e2f08..cedb3dd4c491 100644
--- a/llvm/lib/Target/AIE/AIELegalizerInfo.cpp
+++ b/llvm/lib/Target/AIE/AIELegalizerHelper.cpp
@@ -1,4 +1,4 @@
-//===- AIELegalizerInfo.cpp -----------------------------------------------===//
+//===- AIELegalizerHelper.cpp --------------------------------------------===//
 //
 // This file is licensed under the Apache License v2.0 with LLVM Exceptions.
 // See https://llvm.org/LICENSE.txt for license information.
@@ -8,578 +8,31 @@
 //
 //===----------------------------------------------------------------------===//
 /// \file
-/// This file implements the targeting of the Machinelegalizer class for AIE.
-/// \todo This should be generated by TableGen.
+/// This file implements AIE specific legalization functions //===----------------------------------------------------------------------===// -#include "AIELegalizerInfo.h" -#include "AIE2TargetMachine.h" +#include "AIELegalizerHelper.h" #include "AIEBaseISelLowering.h" -#include "AIEBaseRegisterInfo.h" +#include "AIEBaseInstrInfo.h" +#include "AIEBaseSubtarget.h" #include "AIEMachineFunctionInfo.h" -#include "AIETargetMachine.h" -#include "MCTargetDesc/AIEMCTargetDesc.h" -#include "llvm/Analysis/VectorUtils.h" -#include "llvm/CodeGen/GlobalISel/CallLowering.h" #include "llvm/CodeGen/GlobalISel/GenericMachineInstrs.h" -#include "llvm/CodeGen/GlobalISel/LegalizerHelper.h" -#include "llvm/CodeGen/GlobalISel/LegalizerInfo.h" -#include "llvm/CodeGen/GlobalISel/LostDebugLocObserver.h" #include "llvm/CodeGen/GlobalISel/MachineIRBuilder.h" -#include "llvm/CodeGen/MachineInstrBuilder.h" -#include "llvm/CodeGen/MachineMemOperand.h" -#include "llvm/CodeGen/MachineOperand.h" -#include "llvm/CodeGen/MachineRegisterInfo.h" -#include "llvm/CodeGen/Register.h" #include "llvm/CodeGen/RuntimeLibcalls.h" -#include "llvm/CodeGen/SelectionDAGNodes.h" #include "llvm/CodeGen/TargetOpcodes.h" -#include "llvm/CodeGenTypes/LowLevelType.h" -#include "llvm/IR/IntrinsicsAIE.h" #include "llvm/IR/IntrinsicsAIE2.h" -#include "llvm/Support/Alignment.h" -#include - -using namespace llvm; -using namespace LegalityPredicates; - -static LegalityPredicate isLegalBitCastType(unsigned TypeIdx) { - return [=](const LegalityQuery &Query) { - LLT Ty = Query.Types[TypeIdx]; - if (Ty.isScalar()) - return Ty == LLT::scalar(32) || Ty == LLT::scalar(64); - const int EltSize = Ty.isVector() ? Ty.getElementType().getSizeInBits() : 0; - return EltSize == 8 || EltSize == 16 || EltSize == 32 || EltSize == 64; - }; -} - -static LegalizeMutation bitcastAccToVectorType(unsigned TypeIdx) { - return [=](const LegalityQuery &Query) { - LLT OrigTy = Query.Types[TypeIdx]; - assert(OrigTy.getElementType() == LLT::scalar(64) && - "Expected an accumulator type"); - unsigned Size = OrigTy.getSizeInBits(); - assert(Size % 32 == 0); - return std::pair(TypeIdx, LLT::fixed_vector(Size / 32, 32)); - }; -} - -static LegalizeMutation bitcastToVectorElement32(const unsigned TypeIdx) { - return [=](const LegalityQuery &Query) { - const LLT Ty = Query.Types[TypeIdx]; - unsigned Size = Ty.getSizeInBits(); - assert(Size % 32 == 0); - return std::pair( - TypeIdx, LLT::scalarOrVector(ElementCount::getFixed(Size / 32), 32)); - }; -} - -static LegalityPredicate -isValidVectorMergeUnmergeOp(const unsigned BigVectorId, - const unsigned SmallVectorId) { - return [=](const LegalityQuery &Query) { - const LLT Big = Query.Types[BigVectorId]; - const LLT Small = Query.Types[SmallVectorId]; - return Big.isVector() && Small.isVector() && - Big.getElementType() == Small.getElementType() && - Small.getNumElements() * 2 == Big.getNumElements(); - }; -} - -static LegalityPredicate isValidVectorAIE2(const unsigned TypeIdx) { - return [=](const LegalityQuery &Query) { - const LLT DstTy = Query.Types[TypeIdx]; - const unsigned DstSize = DstTy.getSizeInBits(); - return DstTy.isVector() && (DstSize == 32 || DstSize > 64); - }; -} - -LegalityPredicate -negatePredicate(const std::function &Func) { - return [=](const LegalityQuery &Query) { return !Func(Query); }; -} - -AIELegalizerInfo::AIELegalizerInfo(const AIEBaseSubtarget &ST) { - using namespace TargetOpcode; - const LLT S8 = LLT::scalar(8); - const LLT S16 = LLT::scalar(16); - const LLT S20 = LLT::scalar(20); - const LLT S32 = 
LLT::scalar(32); - const LLT S64 = LLT::scalar(64); - const LLT P0 = LLT::pointer(0, 20); - - // 32-bit vectors - const LLT V4S8 = LLT::fixed_vector(4, 8); - const LLT V2S16 = LLT::fixed_vector(2, 16); - - // 64-bit vectors - const LLT V2S32 = LLT::fixed_vector(2, 32); - - // 128-bit vectors - const LLT V16S8 = LLT::fixed_vector(16, 8); - const LLT V8S16 = LLT::fixed_vector(8, 16); - const LLT V4S32 = LLT::fixed_vector(4, 32); - - // 256-bit vectors - const LLT V8S32 = LLT::fixed_vector(8, 32); - const LLT V16S16 = LLT::fixed_vector(16, 16); - const LLT V32S8 = LLT::fixed_vector(32, 8); - - // 256-bit accumulators - const LLT ACC256 = LLT::fixed_vector(4, 64); - - // 512-bit vectors - const LLT V16S32 = LLT::fixed_vector(16, 32); - const LLT V32S16 = LLT::fixed_vector(32, 16); - const LLT V64S8 = LLT::fixed_vector(64, 8); - - // 512-bit accumulators - const LLT ACC512 = LLT::fixed_vector(8, 64); - - // 1024-bit vectors - const LLT V32S32 = LLT::fixed_vector(32, 32); - const LLT V64S16 = LLT::fixed_vector(64, 16); - const LLT V128S8 = LLT::fixed_vector(128, 8); - - // 1024-bit accumulators - const LLT ACC1024 = LLT::fixed_vector(16, 64); - - const LLT S128 = LLT::scalar(128); - - static const std::initializer_list AIE2VectorTypes = { - /* Begin 32-bit types*/ - V4S8, V2S16, - /* Begin 256-bit types */ - V8S32, V16S16, V32S8, - /* Begin 512-bit types */ - V16S32, V32S16, V64S8, - /* Begin 1024-bit types */ - V32S32, V64S16, V128S8}; - - // Accumulator types are 32-bit vectors that pretend to 64-bit vectors of - // half the size. - static const std::initializer_list AIE2AccumulatorTypes = { - /* Begin 256-bit types */ - ACC256, - /* Begin 512-bit types */ - ACC512, - /* Begin 1024-bit types */ - ACC1024}; - - auto &IMPLICIT = getActionDefinitionsBuilder({G_IMPLICIT_DEF, G_FREEZE}) - .legalFor({S20, S32, P0, S128}); - if (ST.isAIE2()) { - IMPLICIT.legalFor(AIE2VectorTypes); - IMPLICIT.legalFor(AIE2AccumulatorTypes); - } - - IMPLICIT.widenScalarToNextPow2(0).clampScalar(0, S32, S32); - - getActionDefinitionsBuilder(G_CONSTANT) - .legalFor({S20, S32, P0}) - .widenScalarToNextPow2(0) - .clampScalar(0, S32, S32); - - // FIXME: AIE1 actually supports float. But since AIE2 is using the same - // legalizer, we will cast both type to int now. 
- getActionDefinitionsBuilder(G_FCONSTANT).customFor({S16, S32, S64}); - - getActionDefinitionsBuilder(G_ICMP) - .legalFor({{S32, S32}, {S32, P0}}) - .clampScalar(0, S32, S32) - .clampScalar(1, S32, S32); - - if (ST.isAIE2()) { - getActionDefinitionsBuilder(G_FCMP) - .clampScalar(0, S32, S32) - .customFor({{S32, S16}, {S32, S32}}); - - getActionDefinitionsBuilder(G_FPTRUNC) - .libcallFor({{S32, S64}}) - .customFor({{S16, S32}}); - - getActionDefinitionsBuilder({G_SITOFP, G_UITOFP}) - .libcallForCartesianProduct({S32, S64}) - .clampScalar(1, S32, S64) - .widenScalarToNextPow2(1) - .clampScalar(0, S32, S64); - - getActionDefinitionsBuilder(G_FPEXT) - .libcallFor({{S64, S32}}) - .customFor({{S32, S16}}) - .narrowScalarFor({{S64, S16}}, - llvm::LegalizeMutations::changeTo(0, S32)); - - getActionDefinitionsBuilder({G_FPTOSI, G_FPTOUI}) - .libcallForCartesianProduct({S32, S64}) - .clampScalar(0, S32, S64) - .widenScalarToNextPow2(0) - .clampScalar(1, S32, S64); - - getActionDefinitionsBuilder(G_FABS).customFor({S16, S32, S64}); - - getActionDefinitionsBuilder({G_FADD, G_FSUB}) - .legalFor({V16S32}) - .customFor({S16}) - .libcallFor({S32, S64}); - - getActionDefinitionsBuilder({G_FMUL, G_FDIV, G_FREM}) - .clampScalar(0, S32, S64) - .libcallFor({S32, S64}); - } - - if (!ST.isAIE2()) - getActionDefinitionsBuilder({G_FMUL, G_FDIV, G_FADD, G_FSUB, G_FREM}) - .libcallFor({S32, S64}); - - // Since the only integers smaller than 32 bits we produce are S20 (from - // G_PTRTOINT), the only legal extension is S20 -> S32. - // Extensions to types larger than 64 bits have to be broken down into - // multiple parts. - getActionDefinitionsBuilder({G_ANYEXT, G_SEXT, G_ZEXT}) - .legalFor({{S32, S20}}) - .clampScalar(0, S32, S32); - // FIXME: (s|z|any)ext s20 to s64 is broken. - - auto &VANDOR = getActionDefinitionsBuilder({G_AND, G_OR}) - .legalFor({S32}) - .widenScalarToNextPow2(0) - .clampScalar(0, S32, S32); - - if (ST.isAIE2()) - VANDOR.legalFor(AIE2VectorTypes); - - getActionDefinitionsBuilder(G_XOR) - .legalFor({S32}) - .widenScalarToNextPow2(0) - .clampScalar(0, S32, S32); - - getActionDefinitionsBuilder(G_SEXT_INREG) - .custom() - .legalForTypeWithAnyImm({S32}); - - getActionDefinitionsBuilder({G_ASHR, G_LSHR, G_SHL}) - .legalFor({{S32, S32}}) - .widenScalarToNextPow2(0) - .clampScalar(0, S32, S32) - .clampScalar(1, S32, S32); - - getActionDefinitionsBuilder(G_TRUNC).alwaysLegal(); - - auto &SELECT = getActionDefinitionsBuilder(G_SELECT) - .legalFor({{S32, S32}, {P0, S32}}) - .widenScalarToNextPow2(0) - .clampScalar(0, S32, S32) - .clampScalar(1, S32, S32); - - if (ST.isAIE2()) { - SELECT.legalFor(AIE2VectorTypes); - - // We support G_SELECT only on the vector register bank - // Mapping the G_SELECT operands to the vector register bank - // during register bank selection introduces the proper cross-bank - // copies. However, we cannot write ISEL patterns expressing accumulator - // types on vector register banks, which requires to duplicate the vector - // type patterns in C++. Introducing bitcasts during legalization allows to - // re-use the existing code for register bank selection and ISEL patterns. - SELECT.bitcastIf(typeInSet(0, AIE2AccumulatorTypes), - bitcastAccToVectorType(0)); - } - auto &ADDSUB = getActionDefinitionsBuilder({G_ADD, G_SUB}) - .legalFor({S32}) - .widenScalarToNextPow2(0) - .clampScalar(0, S32, S32); - - if (ST.isAIE2()) - ADDSUB.legalFor({V16S32, V32S16, V64S8}); - - // FIXME: G_SADDE/G_SSUBE doesn't support lowering. 
To support this properly, - // the action needs to be implemented - // FIXME: AIE2 has ADC and SBC operations to read the carry. - getActionDefinitionsBuilder({G_UADDO, G_USUBO, G_UADDE, G_USUBE, G_SADDO, - G_SSUBO, G_SADDE, G_SSUBE, G_UADDSAT, G_USUBSAT, - G_SADDSAT, G_SSUBSAT}) - .lower(); - - getActionDefinitionsBuilder(G_MUL) - .legalFor({S32}) - .widenScalarToNextPow2(0) - .minScalar(0, S32) - .libcallFor({S64}); - - // FIXME: G_SMULO, G_UMULO support - getActionDefinitionsBuilder({G_UMULH, G_SMULH}).lower(); - - getActionDefinitionsBuilder({G_SDIV, G_UDIV, G_SREM, G_UREM}) - .libcallFor({S32, S64}) - .widenScalarToNextPow2(0) - .clampScalar(0, S32, S64); - - getActionDefinitionsBuilder({G_SDIVREM, G_UDIVREM}) - .lowerFor({S32, S64}) - .widenScalarToNextPow2(0) - .clampScalar(0, S32, S64); - - getActionDefinitionsBuilder(G_ABS) - .legalFor({S32}) - .lowerFor({S64}) - .widenScalarToNextPow2(0) - .clampScalar(0, S32, S32); - - // The CLZ instruction implements CTLZ, which also covers CTLZ_ZERO_UNDEF - getActionDefinitionsBuilder(G_CTLZ_ZERO_UNDEF) - .lowerFor({{S32, S32}}) - .clampScalar(0, S32, S32) - .clampScalar(1, S32, S32); - - getActionDefinitionsBuilder(G_CTLZ) - .legalFor({{S32, S32}}) - .clampScalar(0, S32, S32) - .clampScalar(1, S32, S32); - - getActionDefinitionsBuilder({G_FSHL, G_FSHR}).lower(); - - getActionDefinitionsBuilder({G_MEMCPY, G_MEMSET, G_MEMMOVE}) - .customIf([=](const LegalityQuery &Query) { - const LLT SizeArg = Query.Types[2]; - return SizeArg == S20; - }) - .libcall(); - - getActionDefinitionsBuilder(G_DYN_STACKALLOC).custom(); - getActionDefinitionsBuilder({G_STACKSAVE, G_STACKRESTORE}).lower(); - - getActionDefinitionsBuilder({G_SMIN, G_SMAX, G_UMIN, G_UMAX}) - .widenScalarToNextPow2(0, 32) - .lower(); - - getActionDefinitionsBuilder({G_FRAME_INDEX, G_GLOBAL_VALUE}).legalFor({P0}); - - getActionDefinitionsBuilder(G_INTTOPTR) - .legalFor({{P0, S20}}) - .widenScalarToNextPow2(1) - .clampScalar(1, S20, S20); - - getActionDefinitionsBuilder(G_PTRTOINT) - .legalFor({{S20, P0}}) - .widenScalarToNextPow2(0) - .clampScalar(0, S20, S20); - - // We support pointer arithmetic on both GPRs (32-bits) and pointer regs - // (20-bits, where the scalar addend resides in a MOD register). 
To allow - // specifying alternative register bank mappings, we need to truncate the RHS - // operand to 20-bits, thus we only allow s20 types for the scalar addend - getActionDefinitionsBuilder(G_PTR_ADD) - .legalFor({{P0, S20}}) - .widenScalarToNextPow2(1) - .clampScalar(1, S20, S20); - - getActionDefinitionsBuilder({G_LOAD, G_STORE}) - .legalForTypesWithMemDesc({ - {S32, P0, S8, 8}, {S32, P0, S16, 16}, - {S20, P0, S20, 32}, {S32, P0, S32, 32}, - {P0, P0, S20, 32}, {V16S8, P0, V16S8, 16}, - {V8S16, P0, V8S16, 16}, {V4S32, P0, V4S32, 16}, - {V8S32, P0, V8S32, 32}, {V16S16, P0, V16S16, 32}, - {V32S8, P0, V32S8, 32}, {V16S32, P0, V16S32, 32}, - {V32S16, P0, V32S16, 32}, {V64S8, P0, V64S8, 32}, - {V32S32, P0, V32S32, 32}, {V64S16, P0, V64S16, 32}, - {V128S8, P0, V128S8, 32}, {ACC256, P0, ACC256, 32}, - {ACC512, P0, ACC512, 32}, {ACC1024, P0, ACC1024, 32}, - {S128, P0, S128, 16}, - }) - .widenScalarToNextPow2(0) - .lowerIfMemSizeNotPow2() - .bitcastIf( - [=](const LegalityQuery &Query) { - const LLT &Ty = Query.Types[0]; - return Ty.isVector() && - (Ty.getSizeInBits() == 64 || Ty.getSizeInBits() == 32); - }, - [=](const LegalityQuery &Query) { - const LLT Ty = Query.Types[0]; - const unsigned Size = Ty.getSizeInBits(); - assert(Size % 32 == 0); - return std::pair(0, LLT::scalar(Size)); - }) - .clampScalar(0, S32, S32) - .lower(); - - // FIXME: Storing a pointer to an un-aligned address isn't supported. - getActionDefinitionsBuilder({G_ZEXTLOAD, G_SEXTLOAD}) - .legalForTypesWithMemDesc({{S32, P0, S8, 8}, {S32, P0, S16, 16}}) - .widenScalarToNextPow2(0) - .lowerIfMemSizeNotPow2() - .clampScalar(0, S32, S32) - .lower(); - - if (ST.isAIE2()) { - getActionDefinitionsBuilder(G_EXTRACT_VECTOR_ELT) - .unsupportedIf([=](const LegalityQuery &Query) { - const LLT &EltTy = Query.Types[1].getElementType(); - return Query.Types[0] != EltTy; - }) - // If it is 32-bit, the LLVM can perform some bitshifts to legalize it - .bitcastIf( - [=](const LegalityQuery &Query) { - const LLT &VecTy = Query.Types[1]; - return VecTy.getSizeInBits() == 32; - }, - bitcastToVectorElement32(1)) - // Extraction is supported for the native types of 32-, 256-, 512- and - // 1024-bit - .customIf(typeInSet(1, {V4S8, V2S16, V2S32, V8S32, V16S32, V32S32, - V16S16, V32S8, V32S16, V64S8, V64S16, V128S8})) - // For 16-bits, we want to increase the number of elements to 4. Since - // our architecture doesn't always support all intermediate sizes, we do - // it as a special case so that we can use them minimum clamp for the - // smallest vector register. - .moreElementsIf( - [=](const LegalityQuery &Query) { - return Query.Types[1].getScalarSizeInBits() == 8 && - Query.Types[1].getNumElements() == 2; - }, - [=](const LegalityQuery &Query) { - return std::make_pair(1, LLT::fixed_vector(4, S8)); - }) - // Increase the input vectors if they don't fit in the smallest vector - // register - .clampMinNumElements(1, S8, 32) - .clampMinNumElements(1, S16, 16) - .clampMinNumElements(1, S32, 8); - - getActionDefinitionsBuilder(G_INSERT_VECTOR_ELT) - .clampScalar(2, S32, S32) // Clamp the idx to 32 bit since VINSERT - // relies on eR29 only for idx. 
- .customIf(typeInSet(0, {V2S32, V8S32, V16S16, V32S8, V16S32, V32S16, - V64S8, V32S32, V64S16, V128S8})); - } - - // Control-flow - getActionDefinitionsBuilder(G_BRCOND).legalFor({S32}).clampScalar(0, S32, - S32); - - auto &PHI = getActionDefinitionsBuilder(G_PHI).legalFor({S20, S32, P0}); - - if (ST.isAIE2()) { - PHI.legalFor(AIE2VectorTypes); - PHI.legalFor(AIE2AccumulatorTypes); - } - - PHI.widenScalarToNextPow2(0).clampScalar(0, S32, S32); - - // Bitcast - vector source and vector destination - For AIEV2 - if (ST.isAIE2()) { - const LegalityPredicate IsNotValidDestinationVector = - negatePredicate(isValidVectorAIE2(0)); - - getActionDefinitionsBuilder(G_BITCAST).legalIf( - LegalityPredicates::all(isLegalBitCastType(0), isLegalBitCastType(1))); - - getActionDefinitionsBuilder(G_MERGE_VALUES).legalFor({{S64, S32}}); - getActionDefinitionsBuilder(G_UNMERGE_VALUES) - .legalFor({{S32, S64}, {S32, V2S32}}) - .customIf([=](const LegalityQuery &Query) { - const LLT &DstTy = Query.Types[0]; - const LLT &SrcTy = Query.Types[1]; - - return SrcTy.isVector() && DstTy.isScalar() && - DstTy == SrcTy.getElementType(); - }) - .unsupportedIf(IsNotValidDestinationVector) - .legalIf(isValidVectorMergeUnmergeOp(1, 0)); - - getActionDefinitionsBuilder(G_CONCAT_VECTORS) - .unsupportedIf(IsNotValidDestinationVector) - .legalIf(isValidVectorMergeUnmergeOp(0, 1)); - - getActionDefinitionsBuilder(G_BUILD_VECTOR) - // Legacy legalization for bitcasts - .legalFor({{V2S32, S32}}) - .unsupportedIf(IsNotValidDestinationVector) - // We clamp the high values and not the low ones, sice the former - // splits the values but the latter keeps the same G_BUILD_VECTOR in - // the output instructions which causes an infinite loop since it - // can't reach our custom legalization code. 
- .clampMaxNumElements(0, S8, 64) - .clampMaxNumElements(0, S16, 32) - .clampMaxNumElements(0, S32, 16) - .custom(); - - getActionDefinitionsBuilder(G_SHUFFLE_VECTOR) - .unsupportedIf(IsNotValidDestinationVector) - // Checks if the shuffle is "canonical", this enables additional actions - // in the LLVM combiner and can change shuffle vectors legalization - .lowerIf([=](const LegalityQuery &Query) { - return Query.Types[0] == Query.Types[1]; - }) - .lower(); - } - getActionDefinitionsBuilder(G_JUMP_TABLE).custom(); +namespace llvm { - getActionDefinitionsBuilder(G_BRJT).custom(); +AIELegalizerHelper::AIELegalizerHelper(const AIEBaseSubtarget &ST) : ST(ST) {} - getActionDefinitionsBuilder(G_BRINDIRECT).legalFor({P0}); - - // Variadic functions - getActionDefinitionsBuilder(G_VASTART).custom(); - getActionDefinitionsBuilder(G_VAARG).custom(); - - getLegacyLegalizerInfo().computeTables(); - verify(*ST.getInstrInfo()); -} - -bool AIELegalizerInfo::legalizeCustom(LegalizerHelper &Helper, MachineInstr &MI, - LostDebugLocObserver &LocObserver) const { - switch (MI.getOpcode()) { - default: - break; - case TargetOpcode::G_VASTART: - return legalizeG_VASTART(Helper, MI); - case TargetOpcode::G_VAARG: - return legalizeG_VAARG(Helper, MI); - case TargetOpcode::G_MEMSET: - case TargetOpcode::G_MEMCPY: - case TargetOpcode::G_MEMMOVE: - return legalizeMemCalls(Helper, MI, LocObserver); - case TargetOpcode::G_BRJT: - return legalizeG_BRJT(Helper, MI); - case TargetOpcode::G_FCONSTANT: - return legalizeG_FCONSTANT(Helper, MI); - case TargetOpcode::G_JUMP_TABLE: - return legalizeG_JUMP_TABLE(Helper, MI); - case TargetOpcode::G_DYN_STACKALLOC: - return legalizeG_DYN_STACKALLOC(Helper, MI); - case TargetOpcode::G_EXTRACT_VECTOR_ELT: - return legalizeG_EXTRACT_VECTOR_ELT(Helper, MI); - case TargetOpcode::G_INSERT_VECTOR_ELT: - return legalizeG_INSERT_VECTOR_ELT(Helper, MI); - case TargetOpcode::G_FCMP: - return legalizeG_FCMP(Helper, MI, LocObserver); - case TargetOpcode::G_FPTRUNC: - return legalizeG_FPTRUNC(Helper, MI); - case TargetOpcode::G_FPEXT: - return legalizeG_FPEXT(Helper, MI); - case TargetOpcode::G_FABS: - return legalizeG_FABS(Helper, MI); - case TargetOpcode::G_FADD: - case TargetOpcode::G_FSUB: - return legalizeG_FADDSUB(Helper, MI); - case TargetOpcode::G_BUILD_VECTOR: - return legalizeG_BUILD_VECTOR(Helper, MI); - case TargetOpcode::G_UNMERGE_VALUES: - return legalizeG_UNMERGE_VALUES(Helper, MI); - case TargetOpcode::G_SEXT_INREG: - return legalizeG_SEXT_INREG(Helper, MI); - } - - llvm_unreachable("Un-expected custom legalization"); +const AIEBaseInstrInfo *AIELegalizerHelper::getInstrInfo() { + return ST.getInstrInfo(); } -bool AIELegalizerInfo::pack32BitVector(LegalizerHelper &Helper, - MachineInstr &MI, - Register SourceReg) const { +bool AIELegalizerHelper::pack32BitVector(LegalizerHelper &Helper, + MachineInstr &MI, + Register SourceReg) const { MachineIRBuilder &MIRBuilder = Helper.MIRBuilder; MachineRegisterInfo &MRI = *MIRBuilder.getMRI(); @@ -603,7 +56,7 @@ bool AIELegalizerInfo::pack32BitVector(LegalizerHelper &Helper, if (RegTy.getScalarSizeInBits() != 32) { const Register TmpReg32 = MRI.createGenericVirtualRegister(S32); - MIRBuilder.buildInstr(AIE2::G_ZEXT, {TmpReg32}, {DestinationOperand}); + MIRBuilder.buildZExt({TmpReg32}, {DestinationOperand}); DestinationOperand = TmpReg32; } @@ -630,9 +83,9 @@ bool AIELegalizerInfo::pack32BitVector(LegalizerHelper &Helper, return true; } -bool AIELegalizerInfo::unpack32BitVector(LegalizerHelper &Helper, - MachineInstr &MI, - Register 
SourceReg) const { +bool AIELegalizerHelper::unpack32BitVector(LegalizerHelper &Helper, + MachineInstr &MI, + Register SourceReg) const { MachineIRBuilder &MIRBuilder = Helper.MIRBuilder; MachineRegisterInfo &MRI = *MIRBuilder.getMRI(); @@ -671,8 +124,8 @@ bool AIELegalizerInfo::unpack32BitVector(LegalizerHelper &Helper, return true; } -bool AIELegalizerInfo::legalizeG_BUILD_VECTOR(LegalizerHelper &Helper, - MachineInstr &MI) const { +bool AIELegalizerHelper::legalizeG_BUILD_VECTOR(LegalizerHelper &Helper, + MachineInstr &MI) const { MachineIRBuilder &MIRBuilder = Helper.MIRBuilder; MachineRegisterInfo &MRI = *MIRBuilder.getMRI(); @@ -698,6 +151,7 @@ bool AIELegalizerInfo::legalizeG_BUILD_VECTOR(LegalizerHelper &Helper, Register Src = MRI.createGenericVirtualRegister(VecTy); MIRBuilder.buildUndef(Src); + const AIEBaseInstrInfo *II = ST.getInstrInfo(); MachineOperand *OperandBegin = MI.operands_begin(), *Operand = MI.operands_end() - 1; while (Operand != OperandBegin) { @@ -712,11 +166,12 @@ bool AIELegalizerInfo::legalizeG_BUILD_VECTOR(LegalizerHelper &Helper, if (DstVecEltTy.getSizeInBits() != 32) { const Register TmpReg32 = MRI.createGenericVirtualRegister(LLT::scalar(32)); - MIRBuilder.buildInstr(AIE2::G_ANYEXT, {TmpReg32}, {Reg}); + MIRBuilder.buildAnyExt({TmpReg32}, {Reg}); Reg = TmpReg32; } - MIRBuilder.buildInstr(AIE2::G_AIE_ADD_VECTOR_ELT_LEFT, {Dst}, {Src, Reg}); + MIRBuilder.buildInstr(II->getGenericAddVectorEltOpcode(), {Dst}, + {Src, Reg}); Src = Dst; --Operand; } @@ -729,17 +184,18 @@ bool AIELegalizerInfo::legalizeG_BUILD_VECTOR(LegalizerHelper &Helper, const Register UnusedSubReg = MRI.createGenericVirtualRegister(DstVecTy); MIRBuilder.buildUnmerge({DstReg, UnusedSubReg}, Src); } else if (DstVecSize == 128) { - MIRBuilder.buildInstr(AIE2::G_AIE_UNPAD_VECTOR, {DstReg}, {Src}); + MIRBuilder.buildInstr(II->getGenericUnpadVectorOpcode(), {DstReg}, {Src}); } MI.eraseFromParent(); return true; } -bool AIELegalizerInfo::legalizeG_UNMERGE_VALUES(LegalizerHelper &Helper, - MachineInstr &MI) const { +bool AIELegalizerHelper::legalizeG_UNMERGE_VALUES(LegalizerHelper &Helper, + MachineInstr &MI) const { MachineIRBuilder &MIRBuilder = Helper.MIRBuilder; MachineRegisterInfo &MRI = *MIRBuilder.getMRI(); + const AIEBaseInstrInfo *II = ST.getInstrInfo(); const Register FirstReg = MI.getOperand(0).getReg(); const Register LastReg = MI.getOperand(MI.getNumOperands() - 1).getReg(); @@ -759,7 +215,7 @@ bool AIELegalizerInfo::legalizeG_UNMERGE_VALUES(LegalizerHelper &Helper, const LLT NewRegTy = LLT::fixed_vector(LastTy.getNumElements() * 2, LastTy.getScalarType()); const Register NewReg = MRI.createGenericVirtualRegister(NewRegTy); - MIRBuilder.buildInstr(AIE2::G_AIE_PAD_VECTOR_UNDEF, {NewReg}, {LastReg}); + MIRBuilder.buildInstr(II->getGenericPadVectorOpcode(), {NewReg}, {LastReg}); TargetReg = NewReg; } @@ -781,8 +237,8 @@ bool AIELegalizerInfo::legalizeG_UNMERGE_VALUES(LegalizerHelper &Helper, return true; } -bool AIELegalizerInfo::legalizeG_SEXT_INREG(LegalizerHelper &Helper, - MachineInstr &MI) const { +bool AIELegalizerHelper::legalizeG_SEXT_INREG(LegalizerHelper &Helper, + MachineInstr &MI) const { MachineIRBuilder &MIRBuilder = Helper.MIRBuilder; MachineRegisterInfo &MRI = *MIRBuilder.getMRI(); @@ -798,8 +254,8 @@ bool AIELegalizerInfo::legalizeG_SEXT_INREG(LegalizerHelper &Helper, return true; } -bool AIELegalizerInfo::legalizeG_VASTART(LegalizerHelper &Helper, - MachineInstr &MI) const { +bool AIELegalizerHelper::legalizeG_VASTART(LegalizerHelper &Helper, + MachineInstr &MI) const { 
   MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
   MachineFunction &MF = MIRBuilder.getMF();
   auto *FuncInfo = MF.getInfo<AIEMachineFunctionInfo>();
@@ -819,8 +275,8 @@
   return true;
 }
 
-bool AIELegalizerInfo::legalizeG_VAARG(LegalizerHelper &Helper,
-                                       MachineInstr &MI) const {
+bool AIELegalizerHelper::legalizeG_VAARG(LegalizerHelper &Helper,
+                                         MachineInstr &MI) const {
   MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
   MachineFunction &MF = MIRBuilder.getMF();
   MachineRegisterInfo &MRI = *MIRBuilder.getMRI();
@@ -866,7 +322,7 @@
   return true;
 }
 
-bool AIELegalizerInfo::legalizeMemCalls(
+bool AIELegalizerHelper::legalizeMemCalls(
     LegalizerHelper &Helper, MachineInstr &MI,
     LostDebugLocObserver &LocObserver) const {
   MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
@@ -921,8 +377,8 @@
   return true;
 }
 
-bool AIELegalizerInfo::legalizeG_BRJT(LegalizerHelper &Helper,
-                                      MachineInstr &MI) const {
+bool AIELegalizerHelper::legalizeG_BRJT(LegalizerHelper &Helper,
+                                        MachineInstr &MI) const {
   MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
   MachineFunction &MF = MIRBuilder.getMF();
   LLT S32 = LLT::scalar(32);
@@ -945,8 +401,8 @@
   return true;
 }
 
-bool AIELegalizerInfo::legalizeG_FCONSTANT(LegalizerHelper &Helper,
-                                           MachineInstr &MI) const {
+bool AIELegalizerHelper::legalizeG_FCONSTANT(LegalizerHelper &Helper,
+                                             MachineInstr &MI) const {
   MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
   LLVMContext &Ctx = MIRBuilder.getMF().getFunction().getContext();
@@ -958,8 +414,8 @@
   return true;
 }
 
-bool AIELegalizerInfo::legalizeG_JUMP_TABLE(LegalizerHelper &Helper,
-                                            MachineInstr &MI) const {
+bool AIELegalizerHelper::legalizeG_JUMP_TABLE(LegalizerHelper &Helper,
+                                              MachineInstr &MI) const {
   Helper.Observer.changingInstr(MI);
   MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
   MI.setDesc(MIRBuilder.getTII().get(TargetOpcode::G_GLOBAL_VALUE));
@@ -967,8 +423,8 @@
   return true;
 }
 
-bool AIELegalizerInfo::legalizeG_DYN_STACKALLOC(LegalizerHelper &Helper,
-                                                MachineInstr &MI) const {
+bool AIELegalizerHelper::legalizeG_DYN_STACKALLOC(LegalizerHelper &Helper,
+                                                  MachineInstr &MI) const {
   MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
   const LLT P0 = LLT::pointer(0, 20);
   Register Dst = MI.getOperand(0).getReg();
@@ -990,8 +446,8 @@
 //%3:_(s32) = G_AIE_SEXT_EXTRACT_VECTOR_ELT %0, %1
 //%4:_(s32) = G_ASSERT_SEXT %3, Elt_Size
 //%2:_(s8) = G_TRUNC %4
-bool AIELegalizerInfo::legalizeG_EXTRACT_VECTOR_ELT(LegalizerHelper &Helper,
-                                                    MachineInstr &MI) const {
+bool AIELegalizerHelper::legalizeG_EXTRACT_VECTOR_ELT(LegalizerHelper &Helper,
+                                                      MachineInstr &MI) const {
   MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
   MachineRegisterInfo &MRI = *MIRBuilder.getMRI();
   const Register DstReg = MI.getOperand(0).getReg();
@@ -1027,20 +483,23 @@
   case 1024: {
     const LLT S8 = LLT::scalar(8);
     const LLT S16 = LLT::scalar(16);
+    const AIEBaseInstrInfo *II = ST.getInstrInfo();
     bool IsS32 = SrcVecEltTy == S32;
     assert((SrcVecEltTy == S8 || SrcVecEltTy == S16 || IsS32) &&
            "Unexpected vector element type for extract vector elt!");
 
     if (!IsS32) {
      const Register ExtEltDstReg = MRI.createGenericVirtualRegister(S32);
      const Register ExtDstReg = MRI.createGenericVirtualRegister(S32);
-      MIRBuilder.buildInstr(AIE2::G_AIE_SEXT_EXTRACT_VECTOR_ELT, {ExtEltDstReg},
-                            {SrcVecReg, IdxReg});
+      MIRBuilder.buildInstr(
+          II->getGenericExtractVectorEltOpcode(/*SignExt*/ true),
+          {ExtEltDstReg}, {SrcVecReg, IdxReg});
       MIRBuilder.buildAssertInstr(TargetOpcode::G_ASSERT_SEXT, ExtDstReg,
                                   ExtEltDstReg, SrcVecEltTy.getSizeInBits());
       MIRBuilder.buildTrunc(DstReg, ExtDstReg);
     } else {
-      MIRBuilder.buildInstr(AIE2::G_AIE_SEXT_EXTRACT_VECTOR_ELT, {DstReg},
-                            {SrcVecReg, IdxReg});
+      MIRBuilder.buildInstr(
+          II->getGenericExtractVectorEltOpcode(/*SignExt*/ true), {DstReg},
+          {SrcVecReg, IdxReg});
     }
     break;
   }
@@ -1051,8 +510,8 @@
   return true;
 }
 
-bool AIELegalizerInfo::legalizeG_INSERT_VECTOR_ELT(LegalizerHelper &Helper,
-                                                   MachineInstr &MI) const {
+bool AIELegalizerHelper::legalizeG_INSERT_VECTOR_ELT(LegalizerHelper &Helper,
+                                                     MachineInstr &MI) const {
   MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
   MachineRegisterInfo &MRI = *MIRBuilder.getMRI();
   const Register DstVecReg = MI.getOperand(0).getReg();
@@ -1091,6 +550,7 @@
   case 512:
   case 1024: {
     const LLT ValTy = MRI.getType(ValReg);
+    const AIEBaseInstrInfo *II = ST.getInstrInfo();
    if (ValTy == LLT::scalar(64)) {
       llvm_unreachable("Unexpected scalar value type for insert vec elt!");
     }
@@ -1101,7 +561,7 @@
     } else {
       NewValReg = ValReg;
     }
-    MIRBuilder.buildInstr(AIE2::G_AIE_INSERT_VECTOR_ELT, {DstVecReg},
+    MIRBuilder.buildInstr(II->getGenericInsertVectorEltOpcode(), {DstVecReg},
                           {SrcVecReg, NewValReg, IdxReg});
     break;
   }
@@ -1158,7 +618,7 @@
   }
 }
 
-bool AIELegalizerInfo::legalizeG_FCMP_FP32(
+bool AIELegalizerHelper::legalizeG_FCMP_FP32(
     LegalizerHelper &Helper, MachineInstr &MI,
     const CmpInst::Predicate FPredicate,
     LostDebugLocObserver &LocObserver) const {
@@ -1258,8 +718,9 @@ unsigned getFCmpIntrID(CmpInst::Predicate Predicate, bool &SwapOperands,
 /// Ordered predicates mentioned in \ref getFCmpIntrID are lowered to AIE2
 /// intrinsics, otherwise, they are promoted to fp32 and supported using
 /// libcalls.
-bool AIELegalizerInfo::legalizeG_FCMP(LegalizerHelper &Helper, MachineInstr &MI,
-                                      LostDebugLocObserver &LocObserver) const {
+bool AIELegalizerHelper::legalizeG_FCMP(
+    LegalizerHelper &Helper, MachineInstr &MI,
+    LostDebugLocObserver &LocObserver) const {
   MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
   MachineRegisterInfo &MRI = *MIRBuilder.getMRI();
   auto &CmpMI = cast<GFCmp>(MI);
@@ -1307,7 +768,7 @@ bool AIELegalizerInfo::legalizeG_FCMP(LegalizerHelper &Helper, MachineInstr &MI,
   auto CreateAndInsert = [&](const Register &SrcReg) {
     Register Vec512Reg = MRI.createGenericVirtualRegister(V32S16);
-    MIRBuilder.buildInstr(AIE2::G_INSERT_VECTOR_ELT, {Vec512Reg},
+    MIRBuilder.buildInstr(TargetOpcode::G_INSERT_VECTOR_ELT, {Vec512Reg},
                           {VecUndef, SrcReg, IdxReg});
     return Vec512Reg;
   };
@@ -1349,8 +810,8 @@ bool AIELegalizerInfo::legalizeG_FCMP(LegalizerHelper &Helper, MachineInstr &MI,
   return true;
 }
 
-bool AIELegalizerInfo::legalizeG_FPTRUNC(LegalizerHelper &Helper,
-                                         MachineInstr &MI) const {
+bool AIELegalizerHelper::legalizeG_FPTRUNC(LegalizerHelper &Helper,
+                                           MachineInstr &MI) const {
   MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
   MachineRegisterInfo &MRI = *MIRBuilder.getMRI();
@@ -1371,7 +832,7 @@
   Register IdxReg = MRI.createGenericVirtualRegister(LLT::scalar(32));
   MIRBuilder.buildUndef(Vec512Undef);
   MIRBuilder.buildConstant(IdxReg, 0);
-  MIRBuilder.buildInstr(AIE2::G_INSERT_VECTOR_ELT, {Vec512Reg},
+  MIRBuilder.buildInstr(TargetOpcode::G_INSERT_VECTOR_ELT, {Vec512Reg},
                         {Vec512Undef, SrcReg, IdxReg});
 
   Register Acc512Reg = MRI.createGenericVirtualRegister(ACC512);
@@ -1379,7 +840,8 @@
   Register Vec256Reg = MRI.createGenericVirtualRegister(V16S16);
   MIRBuilder
-      .buildIntrinsic(Intrinsic::aie2_v16accfloat_to_v16bf16, Vec256Reg, true, false)
+      .buildIntrinsic(Intrinsic::aie2_v16accfloat_to_v16bf16, Vec256Reg, true,
+                      false)
       .addUse(Acc512Reg);
 
   MIRBuilder.buildInstr(TargetOpcode::G_EXTRACT_VECTOR_ELT, {DstReg},
@@ -1388,8 +850,8 @@
   return true;
 }
 
-bool AIELegalizerInfo::legalizeG_FPEXT(LegalizerHelper &Helper,
-                                       MachineInstr &MI) const {
+bool AIELegalizerHelper::legalizeG_FPEXT(LegalizerHelper &Helper,
+                                         MachineInstr &MI) const {
   MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
   MachineRegisterInfo &MRI = *MIRBuilder.getMRI();
@@ -1413,8 +875,8 @@
 }
 
 // Legalized by masking sign bit of both double and float
-bool AIELegalizerInfo::legalizeG_FABS(LegalizerHelper &Helper,
-                                      MachineInstr &MI) const {
+bool AIELegalizerHelper::legalizeG_FABS(LegalizerHelper &Helper,
+                                        MachineInstr &MI) const {
   MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
   MachineRegisterInfo &MRI = *MIRBuilder.getMRI();
@@ -1447,8 +909,8 @@
   return true;
 }
 
-bool AIELegalizerInfo::legalizeG_FADDSUB(LegalizerHelper &Helper,
-                                         MachineInstr &MI) const {
+bool AIELegalizerHelper::legalizeG_FADDSUB(LegalizerHelper &Helper,
+                                           MachineInstr &MI) const {
   MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
   MachineRegisterInfo &MRI = *MIRBuilder.getMRI();
@@ -1470,14 +932,16 @@
   Register Src1Vec = MIRBuilder.buildUndef(V16FP32).getReg(0);
   Register Src2Vec = MIRBuilder.buildUndef(V16FP32).getReg(0);
 
-  Register NewSrc1 = MIRBuilder
-                         .buildInstr(AIE2::G_AIE_INSERT_VECTOR_ELT, {V16FP32},
-                                     {Src1Vec, NewSrcReg1, IdxReg})
-                         .getReg(0);
-  Register NewSrc2 = MIRBuilder
-                         .buildInstr(AIE2::G_AIE_INSERT_VECTOR_ELT, {V16FP32},
-                                     {Src2Vec, NewSrcReg2, IdxReg})
-                         .getReg(0);
+  const unsigned InsertEltOpc =
+      ST.getInstrInfo()->getGenericInsertVectorEltOpcode();
+  Register NewSrc1 =
+      MIRBuilder
+          .buildInstr(InsertEltOpc, {V16FP32}, {Src1Vec, NewSrcReg1, IdxReg})
+          .getReg(0);
+  Register NewSrc2 =
+      MIRBuilder
+          .buildInstr(InsertEltOpc, {V16FP32}, {Src2Vec, NewSrcReg2, IdxReg})
+          .getReg(0);
 
   Register FPOp;
   if (MI.getOpcode() == TargetOpcode::G_FADD)
@@ -1494,8 +958,9 @@
   const Register ExtEltDstReg = MRI.createGenericVirtualRegister(S32);
   const Register ExtDstReg = MRI.createGenericVirtualRegister(S32);
-  MIRBuilder.buildInstr(AIE2::G_AIE_SEXT_EXTRACT_VECTOR_ELT, {ExtEltDstReg},
-                        {Conv, IdxReg});
+  const unsigned ExtractEltOpc =
+      ST.getInstrInfo()->getGenericExtractVectorEltOpcode(/*SignExt*/ true);
+  MIRBuilder.buildInstr(ExtractEltOpc, {ExtEltDstReg}, {Conv, IdxReg});
   MIRBuilder.buildAssertInstr(TargetOpcode::G_ASSERT_SEXT, ExtDstReg,
                               ExtEltDstReg, 16);
   MIRBuilder.buildTrunc(DstReg, ExtDstReg);
@@ -1504,33 +969,24 @@
   return true;
 }
 
-bool AIELegalizerInfo::legalizeIntrinsic(LegalizerHelper &Helper,
-                                         MachineInstr &MI) const {
-
-  // The loop_decrement is a bit of an exception in legalization since it
-  // is an architecture-neutral intrinsic to implement hardware loops, not a
-  // dedicated AIE intrinsic. As such it carries a boolean, which should be
-  // legalized to a 32 bit integer type.
-  switch (cast<GIntrinsic>(MI).getIntrinsicID()) {
-  case Intrinsic::loop_decrement: {
-    assert(MI.getOpcode() == TargetOpcode::G_INTRINSIC_W_SIDE_EFFECTS);
-
-    MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
-    // Insert after our instruction
-    MIRBuilder.setInsertPt(*MI.getParent(), ++MI.getIterator());
-
-    Register OrigDst = MI.getOperand(0).getReg();
-    Register NewDst =
-        MIRBuilder.getMRI()->createGenericVirtualRegister(LLT::scalar(32));
-    // NOTE: we don't inform the observer about this change as we do not want to
-    // revisit this instruction
-    MI.getOperand(0).setReg(NewDst);
-    Register ZExtValueReg =
-        MIRBuilder.buildAssertZExt(LLT::scalar(32), NewDst, 1).getReg(0);
-    MIRBuilder.buildTrunc(OrigDst, ZExtValueReg);
-    return true;
-  }
-  }
+bool AIELegalizerHelper::legalizeLoopDecrement(LegalizerHelper &Helper,
+                                               MachineInstr &MI) const {
+  assert(MI.getOpcode() == TargetOpcode::G_INTRINSIC_W_SIDE_EFFECTS);
+  MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
+  // Insert after our instruction
+  MIRBuilder.setInsertPt(*MI.getParent(), ++MI.getIterator());
+
+  Register OrigDst = MI.getOperand(0).getReg();
+  Register NewDst =
+      MIRBuilder.getMRI()->createGenericVirtualRegister(LLT::scalar(32));
+  // NOTE: we don't inform the observer about this change as we do not want to
+  // revisit this instruction
+  MI.getOperand(0).setReg(NewDst);
+  Register ZExtValueReg =
+      MIRBuilder.buildAssertZExt(LLT::scalar(32), NewDst, 1).getReg(0);
+  MIRBuilder.buildTrunc(OrigDst, ZExtValueReg);
   return true;
 }
+
+} // namespace llvm
diff --git a/llvm/lib/Target/AIE/AIELegalizerInfo.h b/llvm/lib/Target/AIE/AIELegalizerHelper.h
similarity index 76%
rename from llvm/lib/Target/AIE/AIELegalizerInfo.h
rename to llvm/lib/Target/AIE/AIELegalizerHelper.h
index f367eb700d21..91e0f08e6517 100644
--- a/llvm/lib/Target/AIE/AIELegalizerInfo.h
+++ b/llvm/lib/Target/AIE/AIELegalizerHelper.h
@@ -1,4 +1,4 @@
-//===- AIELegalizerInfo -----------------------------------------*- C++ -*-===//
+//===- AIELegalizerHelper.h -------------------------------------*- C++ -*-===//
 //
 // This file is licensed under the Apache License v2.0 with LLVM Exceptions.
 // See https://llvm.org/LICENSE.txt for license information.
@@ -8,31 +8,28 @@
 //
 //===----------------------------------------------------------------------===//
 /// \file
-/// This file declares the targeting of the Machinelegalizer class for AIE.
-/// \todo This should be generated by TableGen.
+/// This file implements AIE-specific legalization functions.
 //===----------------------------------------------------------------------===//
 
-#ifndef LLVM_LIB_TARGET_AIE_AIEMACHINELEGALIZER_H
-#define LLVM_LIB_TARGET_AIE_AIEMACHINELEGALIZER_H
+#ifndef LLVM_LIB_TARGET_AIE_AIELEGALIZERHELPER_H
+#define LLVM_LIB_TARGET_AIE_AIELEGALIZERHELPER_H
 
-#include "llvm/CodeGen/GlobalISel/LegalizerInfo.h"
-#include "llvm/CodeGen/Register.h"
+#include "llvm/CodeGen/GlobalISel/LegalizerHelper.h"
 #include "llvm/IR/InstrTypes.h"
 
 namespace llvm {
-
+struct AIEBaseInstrInfo;
 class AIEBaseSubtarget;
+class LegalizerHelper;
+class MachineInstr;
+
+class AIELegalizerHelper {
+  const AIEBaseSubtarget &ST;
 
-/// This class provides legalization strategies.
-class AIELegalizerInfo : public LegalizerInfo {
 public:
-  AIELegalizerInfo(const AIEBaseSubtarget &ST);
-  bool legalizeCustom(LegalizerHelper &Helper, MachineInstr &MI,
-                      LostDebugLocObserver &LocObserver) const override;
-  bool legalizeIntrinsic(LegalizerHelper &Helper,
-                         MachineInstr &MI) const override;
+  AIELegalizerHelper(const AIEBaseSubtarget &ST);
+  const AIEBaseInstrInfo *getInstrInfo();
 
-private:
   bool legalizeG_VASTART(LegalizerHelper &Helper, MachineInstr &MI) const;
   bool legalizeG_BUILD_VECTOR(LegalizerHelper &Helper, MachineInstr &MI) const;
   bool legalizeG_UNMERGE_VALUES(LegalizerHelper &Helper,
@@ -59,6 +56,7 @@ class AIELegalizerInfo : public LegalizerInfo {
   bool legalizeG_FPEXT(LegalizerHelper &Helper, MachineInstr &MI) const;
   bool legalizeG_FABS(LegalizerHelper &Helper, MachineInstr &MI) const;
   bool legalizeG_FADDSUB(LegalizerHelper &Helper, MachineInstr &MI) const;
+  bool legalizeLoopDecrement(LegalizerHelper &Helper, MachineInstr &MI) const;
 
   // Helper functions for legalization
   bool pack32BitVector(LegalizerHelper &Helper, MachineInstr &MI,
@@ -66,5 +64,7 @@ class AIELegalizerInfo : public LegalizerInfo {
   bool unpack32BitVector(LegalizerHelper &Helper, MachineInstr &MI,
                          Register SourceReg) const;
 };
-} // end namespace llvm
-#endif
+
+} // namespace llvm
+
+#endif // LLVM_LIB_TARGET_AIE_AIELEGALIZERHELPER_H
diff --git a/llvm/lib/Target/AIE/AIESubtarget.cpp b/llvm/lib/Target/AIE/AIESubtarget.cpp
index f98a5b02e9f2..cb965d73c2e7 100644
--- a/llvm/lib/Target/AIE/AIESubtarget.cpp
+++ b/llvm/lib/Target/AIE/AIESubtarget.cpp
@@ -14,10 +14,10 @@
 #include "AIESubtarget.h"
 #include "AIE.h"
+#include "AIE1LegalizerInfo.h"
 #include "AIE1RegisterBankInfo.h"
 #include "AIECallLowering.h"
 #include "AIEFrameLowering.h"
-#include "AIELegalizerInfo.h"
 #include "AIETargetMachine.h"
 #include "llvm/CodeGen/ScheduleDAG.h"
 #include "llvm/MC/TargetRegistry.h"
@@ -52,7 +52,7 @@ AIESubtarget::AIESubtarget(const Triple &TT, StringRef CPU, StringRef TuneCPU,
                     << ABIName << "\n");
 
   CallLoweringInfo.reset(new AIECallLowering(*getTargetLowering()));
-  Legalizer.reset(new AIELegalizerInfo(*this));
+  Legalizer.reset(new AIE1LegalizerInfo(*this));
 
   auto *RBI = new AIE1RegisterBankInfo(*getRegisterInfo());
   RegBankInfo.reset(RBI);
diff --git a/llvm/lib/Target/AIE/CMakeLists.txt b/llvm/lib/Target/AIE/CMakeLists.txt
index b0b66138b7bc..dc16237757b5 100644
--- a/llvm/lib/Target/AIE/CMakeLists.txt
+++ b/llvm/lib/Target/AIE/CMakeLists.txt
@@ -77,7 +77,8 @@ add_llvm_target(AIECodeGen
   AIEInstructionSelector.cpp
   AIEInterBlockScheduling.cpp
   AIEISelDAGToDAG.cpp
-  AIELegalizerInfo.cpp
+  AIELegalizerHelper.cpp
+  AIE1LegalizerInfo.cpp
   AIELiveRegs.cpp
   AIEMachineAlignment.cpp
   AIEMachineBlockPlacement.cpp