From 386aa7200324519ea9a8eff5eb1b3c0517756d24 Mon Sep 17 00:00:00 2001
From: Mengwei Liu
Date: Fri, 6 Jun 2025 13:56:43 -0700
Subject: [PATCH] [BE] Cleanup old ExecuTorch codegen and runtime code (#154165)

Summary: These files were added to pytorch/pytorch before ExecuTorch was
open-sourced. Now is a good time to remove them from pytorch/pytorch, since
the code has already moved to pytorch/executorch.

Test Plan: Rely on CI jobs.

Differential Revision: [D75985423](https://our.internmc.facebook.com/intern/diff/D75985423)

Pull Request resolved: https://github.com/pytorch/pytorch/pull/154165
Approved by: https://github.com/kimishpatel, https://github.com/Skylion007, https://github.com/cyyever
---
 .ci/docker/ci_commit_pins/executorch.txt | 2 +-
 .ci/pytorch/build.sh | 6 -
 CMakeLists.txt | 1 -
 caffe2/CMakeLists.txt | 6 -
 pyproject.toml | 4 -
 setup.py | 2 -
 test/edge/CMakeLists.txt | 74 --
 test/edge/Evalue.h | 479 --------
 test/edge/custom_ops.cpp | 10 -
 test/edge/custom_ops.yaml | 4 -
 test/edge/event_tracer.h | 33 -
 test/edge/event_tracer_hooks.h | 91 --
 test/edge/kernel_runtime_context.h | 44 -
 test/edge/operator_registry.cpp | 45 -
 test/edge/operator_registry.h | 72 --
 test/edge/selected_operators.yaml | 463 --------
 test/edge/templates/Functions.h | 25 -
 test/edge/templates/NativeFunctions.h | 31 -
 .../RegisterCodegenUnboxedKernels.cpp | 28 -
 .../RegisterDispatchKeyCustomOps.cpp | 27 -
 test/edge/templates/RegisterKernels.h | 22 -
 test/edge/templates/RegisterSchema.cpp | 10 -
 test/edge/test_main.cpp | 18 -
 test/edge/test_operator_registration.cpp | 53 -
 tools/BUCK.bzl | 15 -
 tools/test/test_executorch_custom_ops.py | 147 ---
 tools/test/test_executorch_gen.py | 689 -----------
 tools/test/test_executorch_signatures.py | 59 -
 tools/test/test_executorch_types.py | 114 --
 tools/test/test_executorch_unboxing.py | 176 ---
 tools/test/test_selective_build.py | 42 -
 torchgen/build.bzl | 10 -
 torchgen/executorch/__init__.py | 0
 torchgen/executorch/api/__init__.py | 0
 torchgen/executorch/api/custom_ops.py | 151 ---
 torchgen/executorch/api/et_cpp.py | 367 ------
 torchgen/executorch/api/types/__init__.py | 4 -
 torchgen/executorch/api/types/signatures.py | 76 --
 torchgen/executorch/api/types/types.py | 77 --
 torchgen/executorch/api/unboxing.py | 218 ----
 torchgen/executorch/model.py | 220 ----
 torchgen/executorch/parse.py | 153 ---
 torchgen/gen_executorch.py | 1024 -----------------
 43 files changed, 1 insertion(+), 5091 deletions(-)
 delete mode 100644 test/edge/CMakeLists.txt
 delete mode 100644 test/edge/Evalue.h
 delete mode 100644 test/edge/custom_ops.cpp
 delete mode 100644 test/edge/custom_ops.yaml
 delete mode 100644 test/edge/event_tracer.h
 delete mode 100644 test/edge/event_tracer_hooks.h
 delete mode 100644 test/edge/kernel_runtime_context.h
 delete mode 100644 test/edge/operator_registry.cpp
 delete mode 100644 test/edge/operator_registry.h
 delete mode 100644 test/edge/selected_operators.yaml
 delete mode 100644 test/edge/templates/Functions.h
 delete mode 100644 test/edge/templates/NativeFunctions.h
 delete mode 100644 test/edge/templates/RegisterCodegenUnboxedKernels.cpp
 delete mode 100644 test/edge/templates/RegisterDispatchKeyCustomOps.cpp
 delete mode 100644 test/edge/templates/RegisterKernels.h
 delete mode 100644 test/edge/templates/RegisterSchema.cpp
 delete mode 100644 test/edge/test_main.cpp
 delete mode 100644 test/edge/test_operator_registration.cpp
 delete mode 100644 tools/test/test_executorch_custom_ops.py
 delete mode 100644 tools/test/test_executorch_gen.py
 delete mode 100644 tools/test/test_executorch_signatures.py
 delete mode 100644 tools/test/test_executorch_types.py
 delete mode 100644 tools/test/test_executorch_unboxing.py
 delete mode 100644 torchgen/executorch/__init__.py
 delete mode 100644 torchgen/executorch/api/__init__.py
 delete mode 100644 torchgen/executorch/api/custom_ops.py
 delete mode 100644 torchgen/executorch/api/et_cpp.py
 delete mode 100644 torchgen/executorch/api/types/__init__.py
 delete mode 100644 torchgen/executorch/api/types/signatures.py
 delete mode 100644 torchgen/executorch/api/types/types.py
 delete mode 100644 torchgen/executorch/api/unboxing.py
 delete mode 100644 torchgen/executorch/model.py
 delete mode 100644 torchgen/executorch/parse.py
 delete mode 100644 torchgen/gen_executorch.py

diff --git a/.ci/docker/ci_commit_pins/executorch.txt b/.ci/docker/ci_commit_pins/executorch.txt
index ce68b499a8f..248de66edbc 100644
--- a/.ci/docker/ci_commit_pins/executorch.txt
+++ b/.ci/docker/ci_commit_pins/executorch.txt
@@ -1 +1 @@
-b173722085b3f555d6ba4533d6bbaddfd7c71144
+f50bfa92602b45dca884a9e511e5d9ddbe8ba314
diff --git a/.ci/pytorch/build.sh b/.ci/pytorch/build.sh
index 2bcfe9f02b0..979b423d646 100755
--- a/.ci/pytorch/build.sh
+++ b/.ci/pytorch/build.sh
@@ -52,12 +52,6 @@ fi
 export USE_LLVM=/opt/llvm
 export LLVM_DIR=/opt/llvm/lib/cmake/llvm

-if [[ "$BUILD_ENVIRONMENT" == *executorch* ]]; then
-  # To build test_edge_op_registration
-  export BUILD_EXECUTORCH=ON
-  export USE_CUDA=0
-fi
-
 if ! which conda; then
   # In ROCm CIs, we are doing cross compilation on build machines with
   # intel cpu and later run tests on machines with amd cpu.
diff --git a/CMakeLists.txt b/CMakeLists.txt
index dda9a511d95..95172f2166a 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -528,7 +528,6 @@ if(USE_LIGHTWEIGHT_DISPATCH AND NOT STATIC_DISPATCH_BACKEND)
 endif()
 option(TRACING_BASED "Master flag to build Lite Interpreter with tracing build option" OFF)
-option(BUILD_EXECUTORCH "Master flag to build Executorch" ON)
 # This is a fix for a rare build issue on Ubuntu: symbol lookup error:
 # miniconda3/envs/pytorch-py3.7/lib/libmkl_intel_lp64.so: undefined symbol:
 # mkl_blas_dsyrk
diff --git a/caffe2/CMakeLists.txt b/caffe2/CMakeLists.txt
index a83aeff378c..6e9127215b2 100644
--- a/caffe2/CMakeLists.txt
+++ b/caffe2/CMakeLists.txt
@@ -1317,12 +1317,6 @@ install(FILES
   "${TORCH_SRC_DIR}/custom_class_detail.h"
   DESTINATION ${TORCH_INSTALL_INCLUDE_DIR}/torch)
 if(BUILD_TEST)
-  if(BUILD_EXECUTORCH)
-    add_subdirectory(
-      ${TORCH_ROOT}/test/edge
-      ${CMAKE_BINARY_DIR}/test_edge_op_registration
-    )
-  endif()
   if(BUILD_LITE_INTERPRETER)
     add_subdirectory(
       ${TORCH_ROOT}/test/cpp/lite_interpreter_runtime
diff --git a/pyproject.toml b/pyproject.toml
index 054eb4d6ecb..2e18f53163b 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -272,10 +272,6 @@ select = [
     "F401",
     "F403",
 ]
-"torchgen/executorch/api/types/__init__.py" = [
-    "F401",
-    "F403",
-]
 "torch/utils/collect_env.py" = [
     "UP",  # collect_env.py needs to work with older versions of Python
 ]
diff --git a/setup.py b/setup.py
index 9ee5600be12..30e0da7b5c9 100644
--- a/setup.py
+++ b/setup.py
@@ -699,8 +699,6 @@ class build_ext(setuptools.command.build_ext.build_ext):
             )
         if cmake_cache_vars["USE_LIGHTWEIGHT_DISPATCH"]:
             report("-- Using lightweight dispatch")
-        if cmake_cache_vars["BUILD_EXECUTORCH"]:
-            report("-- Building Executorch")
         if cmake_cache_vars["USE_ITT"]:
             report("-- Using ITT")
diff --git a/test/edge/CMakeLists.txt b/test/edge/CMakeLists.txt
deleted file mode 100644
index 985b7720248..00000000000
---
a/test/edge/CMakeLists.txt +++ /dev/null @@ -1,74 +0,0 @@ -cmake_minimum_required(VERSION 3.15) - -set(TORCH_ROOT ${CMAKE_CURRENT_LIST_DIR}/../..) -set(TEST_ROOT ${TORCH_ROOT}/test/edge) -set(OUTPUT_DIRECTORY ${CMAKE_BINARY_DIR}/out) -file(GLOB_RECURSE all_python "${TORCH_ROOT}/torchgen/*.py") -include(${TORCH_ROOT}/cmake/public/utils.cmake) -append_cxx_flag_if_supported("-Wno-unused-private-field" CMAKE_CXX_FLAGS) - -# Generate unboxing kernels -set(GEN_COMMAND - Python::Interpreter -m torchgen.gen_executorch - --source-path=${TEST_ROOT} - --install-dir=${OUTPUT_DIRECTORY} - --tags-path=${TORCH_ROOT}/aten/src/ATen/native/tags.yaml - --aten-yaml-path=${TORCH_ROOT}/aten/src/ATen/native/native_functions.yaml - --use-aten-lib - --op-selection-yaml-path=${TEST_ROOT}/selected_operators.yaml - --custom-ops-yaml-path=${TEST_ROOT}/custom_ops.yaml - ) -set(GEN_COMMAND_sources - ${OUTPUT_DIRECTORY}/RegisterCodegenUnboxedKernelsEverything.cpp - ${OUTPUT_DIRECTORY}/RegisterCPUCustomOps.cpp - ${OUTPUT_DIRECTORY}/Functions.h - ${OUTPUT_DIRECTORY}/NativeFunctions.h - ${OUTPUT_DIRECTORY}/CustomOpsNativeFunctions.h - ) -message(STATUS "Generating sources for unboxing kernels ${GEN_COMMAND}") -add_custom_command( - COMMENT "Generating sources" - OUTPUT ${GEN_COMMAND_sources} - COMMAND ${GEN_COMMAND} - DEPENDS - ${all_python} - ${TORCH_ROOT}/aten/src/ATen/native/native_functions.yaml - ${TORCH_ROOT}/aten/src/ATen/native/tags.yaml - ${TEST_ROOT}/templates/Functions.h - ${TEST_ROOT}/templates/NativeFunctions.h - ${TEST_ROOT}/templates/RegisterCodegenUnboxedKernels.cpp - ${TEST_ROOT}/templates/RegisterDispatchKeyCustomOps.cpp - WORKING_DIRECTORY ${TORCH_ROOT} -) -add_custom_target(unbox_target DEPENDS ${GEN_COMMAND_sources}) - -add_library(unbox_lib STATIC - ${GEN_COMMAND_sources} - ${TEST_ROOT}/operator_registry.cpp - ${TEST_ROOT}/custom_ops.cpp - ) -target_include_directories(unbox_lib PUBLIC ${TEST_ROOT} ${ATen_CPU_INCLUDE}) -target_link_libraries(unbox_lib PUBLIC torch_cpu) -target_compile_definitions(unbox_lib PUBLIC USE_ATEN_LIB) - -add_executable(test_edge_op_registration - ${TEST_ROOT}/test_operator_registration.cpp - ${TEST_ROOT}/test_main.cpp - ) - -target_compile_definitions(test_edge_op_registration PRIVATE USE_GTEST) - -target_link_libraries(test_edge_op_registration PRIVATE gtest_main unbox_lib) -if((CMAKE_CXX_COMPILER_ID MATCHES "AppleClang") OR (APPLE AND CMAKE_CXX_COMPILER_ID MATCHES "Clang")) - target_link_options(test_edge_op_registration PRIVATE - "-Wl,-force_load,$" - ) -elseif(CMAKE_CXX_COMPILER_ID MATCHES "Clang|GNU") - target_link_options(test_edge_op_registration PRIVATE - "-Wl,--whole-archive,$,--no-whole-archive" - ) -endif() -if(INSTALL_TEST) - set_target_properties(test_edge_op_registration PROPERTIES INSTALL_RPATH "${CMAKE_INSTALL_RPATH}:${_rpath_portable_origin}/../lib") - install(TARGETS test_edge_op_registration DESTINATION bin) -endif() diff --git a/test/edge/Evalue.h b/test/edge/Evalue.h deleted file mode 100644 index 7038a7bdaa6..00000000000 --- a/test/edge/Evalue.h +++ /dev/null @@ -1,479 +0,0 @@ -#pragma once - -#include -/** - * WARNING: EValue is a class used by Executorch, for its boxed operators. It - * contains similar logic as `IValue` in PyTorch, by providing APIs to convert - * boxed values to unboxed values. - * - * It's mirroring a fbcode internal source file - * [`EValue.h`](https://www.internalfb.com/code/fbsource/xplat/executorch/core/values/Evalue.h). 
- * - * The reason why we are mirroring this class, is to make sure we have CI job - * coverage on torchgen logic, given that torchgen is used for both Executorch - * and PyTorch. - * - * If any of the logic here needs to be changed, please update fbcode version of - * `Evalue.h` as well. These two versions will be merged as soon as Executorch - * is in OSS (hopefully by Q2 2023). - */ -namespace torch { -namespace executor { - -#define ET_CHECK_MSG TORCH_CHECK_MSG -#define EXECUTORCH_FORALL_TAGS(_) \ - _(None) \ - _(Tensor) \ - _(String) \ - _(Double) \ - _(Int) \ - _(Bool) \ - _(ListBool) \ - _(ListDouble) \ - _(ListInt) \ - _(ListTensor) \ - _(ListScalar) \ - _(ListOptionalTensor) - -enum class Tag : uint32_t { -#define DEFINE_TAG(x) x, - EXECUTORCH_FORALL_TAGS(DEFINE_TAG) -#undef DEFINE_TAG -}; - -struct EValue; - -template -struct evalue_to_const_ref_overload_return { - using type = T; -}; - -template <> -struct evalue_to_const_ref_overload_return { - using type = const at::Tensor&; -}; - -template -struct evalue_to_ref_overload_return { - using type = T; -}; - -template <> -struct evalue_to_ref_overload_return { - using type = at::Tensor&; -}; - -/* - * Helper class used to correlate EValues in the executor table, with the - * unwrapped list of the proper type. Because values in the runtime's values - * table can change during execution, we cannot statically allocate list of - * objects at deserialization. Imagine the serialized list says index 0 in the - * value table is element 2 in the list, but during execution the value in - * element 2 changes (in the case of tensor this means the TensorImpl* stored in - * the tensor changes). To solve this instead they must be created dynamically - * whenever they are used. - */ -template -class EValObjectList { - public: - EValObjectList() = default; - /* - * Wrapped_vals is a list of pointers into the values table of the runtime - * whose destinations correlate with the elements of the list, unwrapped_vals - * is a container of the same size whose serves as memory to construct the - * unwrapped vals. - */ - EValObjectList(EValue** wrapped_vals, T* unwrapped_vals, int size) - : wrapped_vals_(wrapped_vals, size), unwrapped_vals_(unwrapped_vals) {} - /* - * Constructs and returns the list of T specified by the EValue pointers - */ - at::ArrayRef get() const; - - private: - // Source of truth for the list - at::ArrayRef wrapped_vals_; - // Same size as wrapped_vals - mutable T* unwrapped_vals_; -}; - -// Aggregate typing system similar to IValue only slimmed down with less -// functionality, no dependencies on atomic, and fewer supported types to better -// suit embedded systems (ie no intrusive ptr) -struct EValue { - union Payload { - // When in ATen mode at::Tensor is not trivially copyable, this nested union - // lets us handle tensor as a special case while leaving the rest of the - // fields in a simple state instead of requiring a switch on tag everywhere. - union TriviallyCopyablePayload { - TriviallyCopyablePayload() : as_int(0) {} - // Scalar supported through these 3 types - int64_t as_int; - double as_double; - bool as_bool; - // TODO(jakeszwe): convert back to pointers to optimize size of this - // struct - at::ArrayRef as_string; - at::ArrayRef as_int_list; - at::ArrayRef as_double_list; - at::ArrayRef as_bool_list; - EValObjectList as_tensor_list; - EValObjectList> as_list_optional_tensor; - } copyable_union; - - // Since a Tensor just holds a TensorImpl*, there's no value to use Tensor* - // here. 
- at::Tensor as_tensor; - - Payload() {} - ~Payload() {} - }; - - // Data storage and type tag - Payload payload; - Tag tag; - - // Basic ctors and assignments - EValue(const EValue& rhs) : EValue(rhs.payload, rhs.tag) {} - - EValue(EValue&& rhs) noexcept : tag(rhs.tag) { - moveFrom(std::move(rhs)); - } - - EValue& operator=(EValue&& rhs) & noexcept { - if (&rhs == this) { - return *this; - } - - destroy(); - moveFrom(std::move(rhs)); - return *this; - } - - EValue& operator=(EValue const& rhs) & { - // Define copy assignment through copy ctor and move assignment - *this = EValue(rhs); - return *this; - } - - ~EValue() { - destroy(); - } - - /****** None Type ******/ - EValue() : tag(Tag::None) { - payload.copyable_union.as_int = 0; - } - - bool isNone() const { - return tag == Tag::None; - } - - /****** Int Type ******/ - /*implicit*/ EValue(int64_t i) : tag(Tag::Int) { - payload.copyable_union.as_int = i; - } - - bool isInt() const { - return tag == Tag::Int; - } - - int64_t toInt() const { - ET_CHECK_MSG(isInt(), "EValue is not an int."); - return payload.copyable_union.as_int; - } - - /****** Double Type ******/ - /*implicit*/ EValue(double d) : tag(Tag::Double) { - payload.copyable_union.as_double = d; - } - - bool isDouble() const { - return tag == Tag::Double; - } - - double toDouble() const { - ET_CHECK_MSG(isDouble(), "EValue is not a Double."); - return payload.copyable_union.as_double; - } - - /****** Bool Type ******/ - /*implicit*/ EValue(bool b) : tag(Tag::Bool) { - payload.copyable_union.as_bool = b; - } - - bool isBool() const { - return tag == Tag::Bool; - } - - bool toBool() const { - ET_CHECK_MSG(isBool(), "EValue is not a Bool."); - return payload.copyable_union.as_bool; - } - - /****** Scalar Type ******/ - /// Construct an EValue using the implicit value of a Scalar. - /*implicit*/ EValue(at::Scalar s) { - if (s.isIntegral(false)) { - tag = Tag::Int; - payload.copyable_union.as_int = s.to(); - } else if (s.isFloatingPoint()) { - tag = Tag::Double; - payload.copyable_union.as_double = s.to(); - } else if (s.isBoolean()) { - tag = Tag::Bool; - payload.copyable_union.as_bool = s.to(); - } else { - ET_CHECK_MSG(false, "Scalar passed to EValue is not initialized."); - } - } - - bool isScalar() const { - return tag == Tag::Int || tag == Tag::Double || tag == Tag::Bool; - } - - at::Scalar toScalar() const { - // Convert from implicit value to Scalar using implicit constructors. - - if (isDouble()) { - return toDouble(); - } else if (isInt()) { - return toInt(); - } else if (isBool()) { - return toBool(); - } else { - ET_CHECK_MSG(false, "EValue is not a Scalar."); - return c10::Scalar(); - } - } - - /****** Tensor Type ******/ - /*implicit*/ EValue(at::Tensor t) : tag(Tag::Tensor) { - // When built in aten mode, at::Tensor has a non trivial constructor - // destructor, so regular assignment to a union field is UB. Instead we must - // go through placement new (which causes a refcount bump). 
- new (&payload.as_tensor) at::Tensor(t); - } - - bool isTensor() const { - return tag == Tag::Tensor; - } - - at::Tensor toTensor() && { - ET_CHECK_MSG(isTensor(), "EValue is not a Tensor."); - return std::move(payload.as_tensor); - } - - at::Tensor& toTensor() & { - ET_CHECK_MSG(isTensor(), "EValue is not a Tensor."); - return payload.as_tensor; - } - - const at::Tensor& toTensor() const& { - ET_CHECK_MSG(isTensor(), "EValue is not a Tensor."); - return payload.as_tensor; - } - - /****** String Type ******/ - /*implicit*/ EValue(const char* s, size_t size) : tag(Tag::String) { - payload.copyable_union.as_string = at::ArrayRef(s, size); - } - - bool isString() const { - return tag == Tag::String; - } - - std::string_view toString() const { - ET_CHECK_MSG(isString(), "EValue is not a String."); - return std::string_view( - payload.copyable_union.as_string.data(), - payload.copyable_union.as_string.size()); - } - - /****** Int List Type ******/ - /*implicit*/ EValue(at::ArrayRef i) : tag(Tag::ListInt) { - payload.copyable_union.as_int_list = i; - } - - bool isIntList() const { - return tag == Tag::ListInt; - } - - at::ArrayRef toIntList() const { - ET_CHECK_MSG(isIntList(), "EValue is not an Int List."); - return payload.copyable_union.as_int_list; - } - - /****** Bool List Type ******/ - /*implicit*/ EValue(at::ArrayRef b) : tag(Tag::ListBool) { - payload.copyable_union.as_bool_list = b; - } - - bool isBoolList() const { - return tag == Tag::ListBool; - } - - at::ArrayRef toBoolList() const { - ET_CHECK_MSG(isBoolList(), "EValue is not a Bool List."); - return payload.copyable_union.as_bool_list; - } - - /****** Double List Type ******/ - /*implicit*/ EValue(at::ArrayRef d) : tag(Tag::ListDouble) { - payload.copyable_union.as_double_list = d; - } - - bool isDoubleList() const { - return tag == Tag::ListDouble; - } - - at::ArrayRef toDoubleList() const { - ET_CHECK_MSG(isDoubleList(), "EValue is not a Double List."); - return payload.copyable_union.as_double_list; - } - - /****** Tensor List Type ******/ - /*implicit*/ EValue(EValObjectList t) : tag(Tag::ListTensor) { - payload.copyable_union.as_tensor_list = t; - } - - bool isTensorList() const { - return tag == Tag::ListTensor; - } - - at::ArrayRef toTensorList() const { - ET_CHECK_MSG(isTensorList(), "EValue is not a Tensor List."); - return payload.copyable_union.as_tensor_list.get(); - } - - /****** List Optional Tensor Type ******/ - /*implicit*/ EValue(EValObjectList> t) - : tag(Tag::ListOptionalTensor) { - payload.copyable_union.as_list_optional_tensor = t; - } - - bool isListOptionalTensor() const { - return tag == Tag::ListOptionalTensor; - } - - at::ArrayRef> toListOptionalTensor() { - return payload.copyable_union.as_list_optional_tensor.get(); - } - - /****** ScalarType Type ******/ - at::ScalarType toScalarType() const { - ET_CHECK_MSG(isInt(), "EValue is not a ScalarType."); - return static_cast(payload.copyable_union.as_int); - } - - /****** MemoryFormat Type ******/ - at::MemoryFormat toMemoryFormat() const { - ET_CHECK_MSG(isInt(), "EValue is not a MemoryFormat."); - return static_cast(payload.copyable_union.as_int); - } - - template - T to() &&; - - template - typename evalue_to_ref_overload_return::type to() &; - - /** - * Converts the EValue to an optional object that can represent both T and - * an uninitialized state. 
- */ - template - inline std::optional toOptional() { - if (this->isNone()) { - return std::nullopt; - } - return this->to(); - } - - private: - // Pre cond: the payload value has had its destructor called - void clearToNone() noexcept { - payload.copyable_union.as_int = 0; - tag = Tag::None; - } - - // Shared move logic - void moveFrom(EValue&& rhs) noexcept { - if (rhs.isTensor()) { - new (&payload.as_tensor) at::Tensor(std::move(rhs.payload.as_tensor)); - rhs.payload.as_tensor.~Tensor(); - } else { - payload.copyable_union = rhs.payload.copyable_union; - } - tag = rhs.tag; - rhs.clearToNone(); - } - - // Destructs stored tensor if there is one - void destroy() { - // Necessary for ATen tensor to refcount decrement the intrusive_ptr to - // tensorimpl that got a refcount increment when we placed it in the evalue, - // no-op if executorch tensor #ifdef could have a - // minor performance bump for a code maintainability hit - if (isTensor()) { - payload.as_tensor.~Tensor(); - } else if (isTensorList()) { - for (auto& tensor : toTensorList()) { - tensor.~Tensor(); - } - } else if (isListOptionalTensor()) { - for (auto& optional_tensor : toListOptionalTensor()) { - optional_tensor.~optional(); - } - } - } - - EValue(const Payload& p, Tag t) : tag(t) { - if (isTensor()) { - new (&payload.as_tensor) at::Tensor(p.as_tensor); - } else { - payload.copyable_union = p.copyable_union; - } - } -}; - -#define EVALUE_DEFINE_TO(T, method_name) \ - template <> \ - inline evalue_to_ref_overload_return::type EValue::to()& { \ - return static_cast(this->method_name()); \ - } - -template <> -inline at::Tensor& EValue::to() & { - return this->toTensor(); -} - -EVALUE_DEFINE_TO(at::Scalar, toScalar) -EVALUE_DEFINE_TO(int64_t, toInt) -EVALUE_DEFINE_TO(bool, toBool) -EVALUE_DEFINE_TO(double, toDouble) -EVALUE_DEFINE_TO(std::string_view, toString) -EVALUE_DEFINE_TO(at::ScalarType, toScalarType) -EVALUE_DEFINE_TO(at::MemoryFormat, toMemoryFormat) -EVALUE_DEFINE_TO(std::optional, toOptional) -EVALUE_DEFINE_TO(at::ArrayRef, toIntList) -EVALUE_DEFINE_TO( - std::optional>, - toOptional>) -EVALUE_DEFINE_TO( - std::optional>, - toOptional>) -EVALUE_DEFINE_TO(at::ArrayRef>, toListOptionalTensor) -EVALUE_DEFINE_TO(at::ArrayRef, toDoubleList) -#undef EVALUE_DEFINE_TO - -template -at::ArrayRef EValObjectList::get() const { - for (size_t i = 0; i < wrapped_vals_.size(); i++) { - unwrapped_vals_[i] = wrapped_vals_[i]->template to(); - } - return at::ArrayRef{unwrapped_vals_, wrapped_vals_.size()}; -} - -} // namespace executor -} // namespace torch diff --git a/test/edge/custom_ops.cpp b/test/edge/custom_ops.cpp deleted file mode 100644 index cce09841127..00000000000 --- a/test/edge/custom_ops.cpp +++ /dev/null @@ -1,10 +0,0 @@ -#include - -namespace custom { -namespace native { -at::Tensor& add_3_out(const at::Tensor& a, const at::Tensor& b, const at::Tensor& c, at::Tensor& out) { - out = a.add(b).add(c); - return out; -} -} -} diff --git a/test/edge/custom_ops.yaml b/test/edge/custom_ops.yaml deleted file mode 100644 index 2ff2db88f97..00000000000 --- a/test/edge/custom_ops.yaml +++ /dev/null @@ -1,4 +0,0 @@ -- func: custom::add_3.out(Tensor a, Tensor b, Tensor c, *, Tensor(a!) out) -> Tensor(a!) - kernels: - - arg_meta: null - kernel_name: custom::add_3_out diff --git a/test/edge/event_tracer.h b/test/edge/event_tracer.h deleted file mode 100644 index 9a62df3f522..00000000000 --- a/test/edge/event_tracer.h +++ /dev/null @@ -1,33 +0,0 @@ -/* - * Copyright (c) Meta Platforms, Inc. and affiliates. - * All rights reserved. 
- * - * This source code is licensed under the BSD-style license found in the - * LICENSE file in the root directory of this source tree. - */ - -#include -#include - -#pragma once - -namespace torch { -namespace executor { - -typedef uint32_t AllocatorID; -typedef int32_t ChainID; -typedef uint32_t DebugHandle; - -/** - * EventTracer is a class that users can inherit and implement to - * log/serialize/stream etc. the profiling and debugging events that are - * generated at runtime for a model. An example of this is the ETDump - * implementation in the SDK codebase that serializes these events to a - * flatbuffer. - */ -class EventTracer {}; - -struct EventTracerEntry {}; - -} // namespace executor -} // namespace torch diff --git a/test/edge/event_tracer_hooks.h b/test/edge/event_tracer_hooks.h deleted file mode 100644 index 086eae36ac8..00000000000 --- a/test/edge/event_tracer_hooks.h +++ /dev/null @@ -1,91 +0,0 @@ -/* - * Copyright (c) Meta Platforms, Inc. and affiliates. - * All rights reserved. - * - * This source code is licensed under the BSD-style license found in the - * LICENSE file in the root directory of this source tree. - */ - -#pragma once - -#include - -/** - * @file - * - * This file contains the hooks that are inserted across various parts of the - * core runtime code to call into the EventTracer class for logging of profiling - * and debugging events. Any calls made to the EventTracer from the runtime must - * be made via these hooks. - * Users shouldn't directly add these hooks in their code and it's meant only - * for usage in ExecuTorch internal code. - * - * The benefit of defining these hooks is that we can easily control whether or - * not we want to compile in the EventTracer code based on the status of the - * ET_EVENT_TRACER_ENABLED flag. - */ - -namespace torch { -namespace executor { -namespace internal { - -/** - * This class enables scope based profiling where needed using RAII. - * Profiling will be started when the object is created and will end - * when the object goes out of scope. - */ -class EventTracerProfileScope final { - public: - EventTracerProfileScope(EventTracer* event_tracer, const char* name) {}; - - ~EventTracerProfileScope() {}; - - private: - EventTracer* event_tracer_; - EventTracerEntry event_entry_; -}; - -/** - * This class enables scope based profiling where needed using RAII. - * Profiling will be started when the object is created and will end - * when the object goes out of scope. - */ -class EventTracerProfileOpScope final { - public: - EventTracerProfileOpScope(EventTracer* event_tracer, const char* name) {}; - - ~EventTracerProfileOpScope() {}; - - private: - EventTracer* event_tracer_; - EventTracerEntry event_entry_; -}; - -/** - * This class helps us set and then clear out the chain id and debug handle - * values stored in the event tracer class using RAII. This is typically called - * in the executor loop before entering the codegen layer to configure the chain - * id and debug handle of the current instruction being executed. - * After we return from the kernel execution we can then reset the chain id and - * debug handle to defaults when this object goes out of scope. 
- */ -class EventTracerProfileInstructionScope final { - public: - EventTracerProfileInstructionScope( - EventTracer* event_tracer, - ChainID chain_idx, - DebugHandle debug_handle) {}; - - ~EventTracerProfileInstructionScope() {}; - - private: - EventTracer* event_tracer_; -}; - -void event_tracer_log_evalue(EventTracer* event_tracer, EValue& evalue) { - (void)evalue; -} - -} // namespace internal -} // namespace executor -} // namespace torch diff --git a/test/edge/kernel_runtime_context.h b/test/edge/kernel_runtime_context.h deleted file mode 100644 index 74f6914a871..00000000000 --- a/test/edge/kernel_runtime_context.h +++ /dev/null @@ -1,44 +0,0 @@ -#pragma once - -#include "event_tracer.h" - -namespace torch { -namespace executor { - -/** - * Bucket type abstraction that contains many elements of runtime state that - * a kernel author may want available, but would otherwise be unable to access. - * - * Forwarded along to all operators when running in lean mode. NOTE: Will not be - * forwarded to operators if running in ATen mode as those operators do not - * expect to receive a KernelRuntimeContext and would not use it. - * - * This includes things like setting an error state, a scratch allocator for - * operators that need more then constant space, and a TensorResizer for dynamic - * shape tensors allowing programs to be more flexible with Tensor shape. - */ -class KernelRuntimeContext { - public: - /** - * Construct a new kernel runtime context along with an optional event tracer. - */ - KernelRuntimeContext(EventTracer* event_tracer = nullptr) - : event_tracer_(event_tracer) {} - - /** - * INTERNAL ONLY - * - * Returns a pointer to an instance of EventTracer to do profiling/debugging - * logging inside the codegen layer. This is only for internal usage inside - * the codegen layer and users should not be accessing this. 
- */ - EventTracer* internal_event_tracer() { - return event_tracer_; - } - - private: - EventTracer* event_tracer_; -}; - -} // namespace executor -} // namespace torch diff --git a/test/edge/operator_registry.cpp b/test/edge/operator_registry.cpp deleted file mode 100644 index 765afa66e7a..00000000000 --- a/test/edge/operator_registry.cpp +++ /dev/null @@ -1,45 +0,0 @@ -#include -#include - -namespace torch { -namespace executor { - -KernelRegistry& getKernelRegistry() { - static KernelRegistry kernel_registry; - return kernel_registry; -} - -bool register_kernels(const ArrayRef& kernels) { - return getKernelRegistry().register_kernels(kernels); -} - -bool KernelRegistry::register_kernels( - const ArrayRef& kernels) { - for (const auto& kernel : kernels) { - this->kernels_map_[kernel.name_] = kernel.kernel_; - } - return true; -} - -bool hasKernelFn(const char* name) { - return getKernelRegistry().hasKernelFn(name); -} - -bool KernelRegistry::hasKernelFn(const char* name) { - auto kernel = this->kernels_map_.find(name); - return kernel != this->kernels_map_.end(); -} - -KernelFunction& getKernelFn(const char* name) { - return getKernelRegistry().getKernelFn(name); -} - -KernelFunction& KernelRegistry::getKernelFn(const char* name) { - auto kernel = this->kernels_map_.find(name); - TORCH_CHECK_MSG(kernel != this->kernels_map_.end(), "Kernel not found!"); - return kernel->second; -} - - -} // namespace executor -} // namespace torch diff --git a/test/edge/operator_registry.h b/test/edge/operator_registry.h deleted file mode 100644 index 3fd1708a8b7..00000000000 --- a/test/edge/operator_registry.h +++ /dev/null @@ -1,72 +0,0 @@ -#pragma once - -#include -#include -#include - -#include "Evalue.h" -#include "kernel_runtime_context.h" - -#include - -namespace torch { -namespace executor { - -using KernelFunction = std::function; - -template -using ArrayRef = at::ArrayRef; - -#define EXECUTORCH_SCOPE_PROF(x) - -struct Kernel { - const char* name_; - KernelFunction kernel_; - - Kernel() = default; - - /** - * We are doing a copy of the string pointer instead of duplicating the string - * itself, we require the lifetime of the kernel name to be at least as long - * as the kernel registry. 
- */ - explicit Kernel(const char* name, KernelFunction func) - : name_(name), kernel_(func) {} -}; - -/** - * See KernelRegistry::hasKernelFn() - */ -bool hasKernelFn(const char* name); - -/** - * See KernelRegistry::getKernelFn() - */ -KernelFunction& getKernelFn(const char* name); - - -[[nodiscard]] bool register_kernels(const ArrayRef&); - -struct KernelRegistry { - public: - KernelRegistry() : kernelRegSize_(0) {} - - bool register_kernels(const ArrayRef&); - - /** - * Checks whether an kernel with a given name is registered - */ - bool hasKernelFn(const char* name); - - /** - * Checks whether an kernel with a given name is registered - */ - KernelFunction& getKernelFn(const char* name); - - private: - std::map kernels_map_; - uint32_t kernelRegSize_; -}; - -} // namespace executor -} // namespace torch diff --git a/test/edge/selected_operators.yaml b/test/edge/selected_operators.yaml deleted file mode 100644 index 70545ae216f..00000000000 --- a/test/edge/selected_operators.yaml +++ /dev/null @@ -1,463 +0,0 @@ -build_features: [] -custom_classes: [] -include_all_non_op_selectives: false -include_all_operators: false -kernel_metadata: {} -et_kernel_metadata: - custom::add_3.out: - - v1/6;0,1,2,3|6;0,1,2,3|6;0,1,2,3 - - v1/3;0,1,2,3|3;0,1,2,3|3;0,1,2,3 - aten::add.out: - - v1/6;0,1,2,3|6;0,1,2,3|6;0,1,2,3 - - v1/3;0,1,2,3|3;0,1,2,3|3;0,1,2,3 -operators: - aten::_fake_quantize_per_tensor_affine_cachemask_tensor_qparams.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::_reshape_alias_copy.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::_softmax.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::_to_copy.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::_unique2.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::add.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::addmm.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::avg_pool2d.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::baddbmm.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::bitwise_and.Tensor_out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::bmm.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::cat.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::clamp.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::clone.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::constant_pad_nd.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::conv1d.out: - 
debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::convolution.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::cumsum.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::detach_copy.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::div.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::embedding.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::eq.Scalar_out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::eq.Tensor_out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::exp.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::expand_copy.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::floor_divide.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::gelu.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::grid_sampler_2d.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::gt.Scalar_out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::index.Tensor_out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::index_put.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::index_select.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::leaky_relu.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::linalg_inv_ex.inverse: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::logit.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::masked_fill.Scalar_out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::max.unary_out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::max_pool2d_with_indices.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::mean.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::minimum.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::mm.out: - debug_info: - 
- functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::mul.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::native_batch_norm.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::native_layer_norm.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::ne.Scalar_out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::nonzero.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::permute_copy.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::pixel_shuffle.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::relu.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::remainder.Scalar_out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::repeat.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::round.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::rsub.Scalar_out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::select_copy.int_out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::sigmoid.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::slice_copy.Tensor_out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::softplus.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::sort.values: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::split_copy.Tensor_out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::split_with_sizes_copy.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::stack.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::sub.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::sum.IntList_out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::tanh.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::topk.values: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::transpose_copy.int_out: - 
debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::unbind_copy.int_out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::unsafe_split.Tensor_out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::unsqueeze_copy.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::upsample_bilinear2d.vec_out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::upsample_nearest2d.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::upsample_nearest2d.vec_out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::view_copy.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - aten::zeros_like.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true - custom::add_3.out: - debug_info: - - functions.yaml - include_all_overloads: false - is_root_operator: true - is_used_for_training: true diff --git a/test/edge/templates/Functions.h b/test/edge/templates/Functions.h deleted file mode 100644 index 5355b3890f8..00000000000 --- a/test/edge/templates/Functions.h +++ /dev/null @@ -1,25 +0,0 @@ -// clang-format off -#pragma once -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -// ${generated_comment} - -${static_dispatch_extra_headers} - -namespace torch { -namespace executor { - -${Functions_declarations} - -} // namespace executor -} // namespace torch diff --git a/test/edge/templates/NativeFunctions.h b/test/edge/templates/NativeFunctions.h deleted file mode 100644 index c71a4ea2ec0..00000000000 --- a/test/edge/templates/NativeFunctions.h +++ /dev/null @@ -1,31 +0,0 @@ -#pragma once - -// ${generated_comment} - -#ifdef TORCH_ASSERT_NO_OPERATORS -#error This change adds a dependency on native_functions.yaml, \ - meaning the file will need to be re-compiled every time an operator \ - is changed or added. Consider if your change would be better placed in \ - another file, or if a more specific header might achieve the same goal. \ - See NOTE: [Tensor vs. TensorBase] -#endif - -#if defined(AT_PER_OPERATOR_HEADERS) && defined(TORCH_ASSERT_ONLY_METHOD_OPERATORS) -#error This change adds a dependency on all pytorch operators, meaning the \ - file will need to be re-compiled every time an operator is changed or added. \ - Consider including a specific operator from \ - and see NOTE [TORCH_ASSERT_ONLY_METHOD_OPERATORS]. 
-#endif - -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include - -${nativeFunctions_declarations} diff --git a/test/edge/templates/RegisterCodegenUnboxedKernels.cpp b/test/edge/templates/RegisterCodegenUnboxedKernels.cpp deleted file mode 100644 index 40c6779e939..00000000000 --- a/test/edge/templates/RegisterCodegenUnboxedKernels.cpp +++ /dev/null @@ -1,28 +0,0 @@ -#include -#include -#include "${fn_header}" // Generated Function import headers - -namespace torch { -namespace executor { - -using namespace internal; - -namespace { -using KernelArrayRef = ::at::ArrayRef<::torch::executor::Kernel>; - -static Kernel kernels_to_register[] = { - ${unboxed_kernels} // Generated operators -}; - -// Explicitly convert to ArrayRef, so that the API can take an empty C array of -// Kernels. -static KernelArrayRef kernel_array_ref( - kernels_to_register, - kernels_to_register + sizeof(kernels_to_register) / sizeof(Kernel)); - -// Return value not used. Keep the static variable assignment to register -// operators in static initialization time. -static auto success_with_kernel_reg = register_kernels(kernel_array_ref); -} // namespace -} // namespace executor -} // namespace torch diff --git a/test/edge/templates/RegisterDispatchKeyCustomOps.cpp b/test/edge/templates/RegisterDispatchKeyCustomOps.cpp deleted file mode 100644 index 14c3d085f93..00000000000 --- a/test/edge/templates/RegisterDispatchKeyCustomOps.cpp +++ /dev/null @@ -1,27 +0,0 @@ -// clang-format off -// Generated code for registering custom operators into the dispatcher. - -#include -#include - -$ops_headers - -namespace torch { -namespace executor { -namespace function { - - -${dispatch_anonymous_definitions} - -// All out variants ops -${static_init_dispatch_registrations} - -namespace ${dispatch_namespace} -{ - ${dispatch_namespaced_definitions} - -} // namespace ${dispatch_namespace} - -} // namespace function -} // namespace executor -} // namespace torch diff --git a/test/edge/templates/RegisterKernels.h b/test/edge/templates/RegisterKernels.h deleted file mode 100644 index 3c7ecff50b5..00000000000 --- a/test/edge/templates/RegisterKernels.h +++ /dev/null @@ -1,22 +0,0 @@ -/* - * Copyright (c) Meta Platforms, Inc. and affiliates. - * All rights reserved. - * - * This source code is licensed under the BSD-style license found in the - * LICENSE file in the root directory of this source tree. - */ - -// ${generated_comment} -// Exposing an API for registering all kernels at once. 
-#include -#include -#include -#include - -namespace torch { -namespace executor { - -Error register_all_kernels(); - -} // namespace executor -} // namespace torch diff --git a/test/edge/templates/RegisterSchema.cpp b/test/edge/templates/RegisterSchema.cpp deleted file mode 100644 index f2ba92a4305..00000000000 --- a/test/edge/templates/RegisterSchema.cpp +++ /dev/null @@ -1,10 +0,0 @@ -// ${generated_comment} -#define TORCH_ASSERT_ONLY_METHOD_OPERATORS -#include - -namespace at { -TORCH_LIBRARY_FRAGMENT(aten, m) { - ${aten_schema_registrations}; -} -$schema_registrations -} // namespace at diff --git a/test/edge/test_main.cpp b/test/edge/test_main.cpp deleted file mode 100644 index 5c5cabccaaa..00000000000 --- a/test/edge/test_main.cpp +++ /dev/null @@ -1,18 +0,0 @@ -#include - -std::string add_negative_flag(const std::string& flag) { - std::string filter = ::testing::GTEST_FLAG(filter); - if (filter.find('-') == std::string::npos) { - filter.push_back('-'); - } else { - filter.push_back(':'); - } - filter += flag; - return filter; -} -int main(int argc, char* argv[]) { - ::testing::InitGoogleTest(&argc, argv); - ::testing::GTEST_FLAG(filter) = add_negative_flag("*_CUDA:*_MultiCUDA"); - - return RUN_ALL_TESTS(); -} diff --git a/test/edge/test_operator_registration.cpp b/test/edge/test_operator_registration.cpp deleted file mode 100644 index eed4c31c70c..00000000000 --- a/test/edge/test_operator_registration.cpp +++ /dev/null @@ -1,53 +0,0 @@ -#include "kernel_runtime_context.h" -#include "operator_registry.h" - -#include - -namespace torch { -namespace executor { - -// add.out(Tensor self, Tensor other, *, Scalar alpha=1, Tensor(a!) out) -> Tensor(a!) -TEST(OperatorRegistrationTest, Add) { - EValue values[4]; - values[0] = EValue(at::ones({2, 3})); - values[1] = EValue(at::ones({2, 3})); - values[2] = EValue(int64_t(1)); - values[3] = EValue(at::zeros({2, 3})); - ASSERT_TRUE(hasKernelFn("aten::add.out")); - auto op = getKernelFn("aten::add.out"); - - EValue* kernel_values[4]; - for (size_t i = 0; i < 4; i++) { - kernel_values[i] = &values[i]; - } - KernelRuntimeContext context{}; - op(context, kernel_values); - at::Tensor expected = at::ones({2, 3}); - expected = at::fill(expected, 2); - ASSERT_TRUE(expected.equal(kernel_values[3]->toTensor())); - -} - -// custom::add_3.out(Tensor a, Tensor b, Tensor c, *, Tensor(a!) out) -> Tensor(a!) 
-TEST(OperatorRegistrationTest, CustomAdd3) { - EValue values[4]; - values[0] = EValue(at::ones({2, 3})); - values[1] = EValue(at::ones({2, 3})); - values[2] = EValue(at::ones({2, 3})); - values[3] = EValue(at::zeros({2, 3})); - ASSERT_TRUE(hasKernelFn("custom::add_3.out")); - auto op = getKernelFn("custom::add_3.out"); - - EValue* kernel_values[4]; - for (size_t i = 0; i < 4; i++) { - kernel_values[i] = &values[i]; - } - KernelRuntimeContext context{}; - op(context, kernel_values); - at::Tensor expected = at::ones({2, 3}); - expected = at::fill(expected, 3); - ASSERT_TRUE(expected.equal(kernel_values[3]->toTensor())); - -} -} // namespace executor -} // namespace torch diff --git a/tools/BUCK.bzl b/tools/BUCK.bzl index 86a48bbc246..5b25c5caeb1 100644 --- a/tools/BUCK.bzl +++ b/tools/BUCK.bzl @@ -287,18 +287,3 @@ def define_tools_targets( ":autograd", ], ) - - python_test( - name = "test_torchgen_executorch", - srcs = [ - "test/test_executorch_gen.py", - "test/test_executorch_signatures.py", - "test/test_executorch_types.py", - "test/test_executorch_unboxing.py", - ], - contacts = contacts, - visibility = ["PUBLIC"], - deps = [ - torchgen_deps, - ], - ) diff --git a/tools/test/test_executorch_custom_ops.py b/tools/test/test_executorch_custom_ops.py deleted file mode 100644 index 767fe0580b1..00000000000 --- a/tools/test/test_executorch_custom_ops.py +++ /dev/null @@ -1,147 +0,0 @@ -from __future__ import annotations - -import tempfile -import unittest -from typing import Any -from unittest.mock import ANY, Mock, patch - -import expecttest - -import torchgen -from torchgen.executorch.api.custom_ops import ComputeNativeFunctionStub -from torchgen.executorch.model import ETKernelIndex -from torchgen.gen_executorch import gen_headers -from torchgen.model import Location, NativeFunction -from torchgen.selective_build.selector import SelectiveBuilder -from torchgen.utils import FileManager - - -SPACES = " " - - -def _get_native_function_from_yaml(yaml_obj: dict[str, object]) -> NativeFunction: - native_function, _ = NativeFunction.from_yaml( - yaml_obj, - loc=Location(__file__, 1), - valid_tags=set(), - ) - return native_function - - -class TestComputeNativeFunctionStub(expecttest.TestCase): - """ - Could use torch.testing._internal.common_utils to reduce boilerplate. - GH CI job doesn't build torch before running tools unit tests, hence - manually adding these parametrized tests. - """ - - def _test_function_schema_generates_correct_kernel( - self, obj: dict[str, Any], expected: str - ) -> None: - func = _get_native_function_from_yaml(obj) - - gen = ComputeNativeFunctionStub() - res = gen(func) - self.assertIsNotNone(res) - self.assertExpectedInline( - str(res), - expected, - ) - - def test_function_schema_generates_correct_kernel_tensor_out(self) -> None: - obj = {"func": "custom::foo.out(Tensor self, *, Tensor(a!) 
out) -> Tensor(a!)"} - expected = """ -at::Tensor & wrapper_CPU_out_foo_out(const at::Tensor & self, at::Tensor & out) { - return out; -} - """ - self._test_function_schema_generates_correct_kernel(obj, expected) - - def test_function_schema_generates_correct_kernel_no_out(self) -> None: - obj = {"func": "custom::foo.Tensor(Tensor self) -> Tensor"} - expected = """ -at::Tensor wrapper_CPU_Tensor_foo(const at::Tensor & self) { - return self; -} - """ - self._test_function_schema_generates_correct_kernel(obj, expected) - - def test_function_schema_generates_correct_kernel_no_return(self) -> None: - obj = {"func": "custom::foo.out(Tensor self, *, Tensor(a!)[] out) -> ()"} - expected = f""" -void wrapper_CPU_out_foo_out(const at::Tensor & self, at::TensorList out) {{ -{SPACES} -}} - """ - self._test_function_schema_generates_correct_kernel(obj, expected) - - def test_function_schema_generates_correct_kernel_3_returns(self) -> None: - obj = { - "func": "custom::foo(Tensor self, Tensor[] other) -> (Tensor, Tensor, Tensor)" - } - expected = """ -::std::tuple wrapper_CPU__foo(const at::Tensor & self, at::TensorList other) { - return ::std::tuple( - at::Tensor(), at::Tensor(), at::Tensor() - ); -} - """ - self._test_function_schema_generates_correct_kernel(obj, expected) - - def test_function_schema_generates_correct_kernel_1_return_no_out(self) -> None: - obj = {"func": "custom::foo(Tensor[] a) -> Tensor"} - expected = """ -at::Tensor wrapper_CPU__foo(at::TensorList a) { - return at::Tensor(); -} - """ - self._test_function_schema_generates_correct_kernel(obj, expected) - - def test_schema_has_no_return_type_argument_throws(self) -> None: - func = _get_native_function_from_yaml( - {"func": "custom::foo.bool(Tensor self) -> bool"} - ) - - gen = ComputeNativeFunctionStub() - with self.assertRaisesRegex(Exception, "Can't handle this return type"): - gen(func) - - -class TestGenCustomOpsHeader(unittest.TestCase): - @patch.object(torchgen.utils.FileManager, "write_with_template") - @patch.object(torchgen.utils.FileManager, "write") - def test_fm_writes_custom_ops_header_when_boolean_is_true( - self, unused: Mock, mock_method: Mock - ) -> None: - with tempfile.TemporaryDirectory() as tempdir: - fm = FileManager(tempdir, tempdir, False) - gen_headers( - native_functions=[], - gen_custom_ops_header=True, - custom_ops_native_functions=[], - selector=SelectiveBuilder.get_nop_selector(), - kernel_index=ETKernelIndex(index={}), - cpu_fm=fm, - use_aten_lib=False, - ) - mock_method.assert_called_once_with( - "CustomOpsNativeFunctions.h", "NativeFunctions.h", ANY - ) - - @patch.object(torchgen.utils.FileManager, "write_with_template") - @patch.object(torchgen.utils.FileManager, "write") - def test_fm_doesnot_writes_custom_ops_header_when_boolean_is_false( - self, unused: Mock, mock_method: Mock - ) -> None: - with tempfile.TemporaryDirectory() as tempdir: - fm = FileManager(tempdir, tempdir, False) - gen_headers( - native_functions=[], - gen_custom_ops_header=False, - custom_ops_native_functions=[], - selector=SelectiveBuilder.get_nop_selector(), - kernel_index=ETKernelIndex(index={}), - cpu_fm=fm, - use_aten_lib=False, - ) - mock_method.assert_not_called() diff --git a/tools/test/test_executorch_gen.py b/tools/test/test_executorch_gen.py deleted file mode 100644 index 9448265aa71..00000000000 --- a/tools/test/test_executorch_gen.py +++ /dev/null @@ -1,689 +0,0 @@ -from __future__ import annotations - -import os -import tempfile -import unittest - -import yaml - -from torchgen.executorch.model import 
ETKernelIndex, ETKernelKey -from torchgen.gen import LineLoader -from torchgen.gen_executorch import ( - ComputeCodegenUnboxedKernels, - gen_functions_declarations, - parse_yaml_files, - translate_native_yaml, -) -from torchgen.model import ( - BackendIndex, - BackendMetadata, - DispatchKey, - Location, - NativeFunction, - OperatorName, -) -from torchgen.selective_build.selector import SelectiveBuilder - - -TEST_YAML = """ -- func: add.out(Tensor self, Tensor other, *, Scalar alpha=1, Tensor(a!) out) -> Tensor(a!) - device_check: NoCheck # TensorIterator - structured: True - structured_inherits: TensorIteratorBase - ufunc_inner_loop: - Generic: add (AllAndComplex, BFloat16, Half, ComplexHalf) - ScalarOnly: add (Bool) - dispatch: - SparseCPU: add_out_sparse_cpu - SparseCUDA: add_out_sparse_cuda - SparseCsrCPU: add_out_sparse_csr_cpu - SparseCsrCUDA: add_out_sparse_csr_cuda - MkldnnCPU: mkldnn_add_out - MPS: add_out_mps - -- func: add.Tensor(Tensor self, Tensor other, *, Scalar alpha=1) -> Tensor - device_check: NoCheck # TensorIterator - structured_delegate: add.out - variants: function, method - dispatch: - SparseCPU, SparseCUDA: add_sparse - SparseCsrCPU, SparseCsrCUDA: add_sparse_csr - MkldnnCPU: mkldnn_add - ZeroTensor: add_zerotensor - NestedTensorCPU, NestedTensorCUDA: NestedTensor_add_Tensor - tags: core - -- func: mul.out(Tensor self, Tensor other, *, Tensor(a!) out) -> Tensor(a!) - device_check: NoCheck # TensorIterator - structured: True - structured_inherits: TensorIteratorBase - dispatch: - CPU, CUDA: mul_out - MPS: mul_out_mps - SparseCPU: mul_out_sparse_cpu - SparseCUDA: mul_out_sparse_cuda - SparseCsrCPU, SparseCsrCUDA: mul_out_sparse_csr - MkldnnCPU: mkldnn_mul_out - -- func: mul.Tensor(Tensor self, Tensor other) -> Tensor - device_check: NoCheck # TensorIterator - structured_delegate: mul.out - variants: function, method - dispatch: - SparseCPU, SparseCUDA: mul_sparse - SparseCsrCPU, SparseCsrCUDA: mul_sparse_csr - MkldnnCPU: mkldnn_mul - ZeroTensor: mul_zerotensor - NestedTensorCPU, NestedTensorCUDA: NestedTensor_mul_Tensor - tags: core - -""" - - -TEST_KERNEL_YAML = """ -- func: add.out(Tensor self, Tensor other, *, Scalar alpha=1, Tensor(a!) out) -> Tensor(a!) - device_check: NoCheck # TensorIterator - structured: True - structured_inherits: TensorIteratorBase - ufunc_inner_loop: - Generic: add (AllAndComplex, BFloat16, Half, ComplexHalf) - ScalarOnly: add (Bool) - type_alias: - T0: [Float, Double] - T1: [Double, Int] - dim_order_alias: - D0: [0, 1, 2, 3] - D1: [0, 3, 2, 1] - kernels: - - arg_meta: null - kernel_name: default_impl - - arg_meta: - self: [T0, D0] - other: [T1, D0] - out: [T0, D0] - kernel_name: test_impl - - arg_meta: - self: [T1, D0] - other: [T1, D1] - out: [T0, D1] - kernel_name: test_impl_2 - -- func: add.Tensor(Tensor self, Tensor other, *, Scalar alpha=1) -> Tensor - device_check: NoCheck # TensorIterator - structured_delegate: add.out - variants: function, method - tags: core - -- func: mul.out(Tensor self, Tensor other, *, Tensor(a!) out) -> Tensor(a!) 
- device_check: NoCheck # TensorIterator - structured: True - structured_inherits: TensorIteratorBase - type_alias: - T0: [Float] - T1: [Double] - dim_order_alias: - D0: [0, 1, 2, 3] - kernels: - - arg_meta: null - kernel_name: default_impl - - arg_meta: - self: [T0, D0] - other: [T1, D0] - out: [T0, D0] - kernel_name: test_impl - -- func: mul.Tensor(Tensor self, Tensor other) -> Tensor - device_check: NoCheck # TensorIterator - structured_delegate: mul.out - variants: function, method - tags: core - -""" - - -class TestParseNativeYaml(unittest.TestCase): - def setUp(self) -> None: - self.temp_dir = tempfile.mkdtemp() - - self.aten_yaml_path = os.path.join(self.temp_dir, "test_native_functions.yaml") - with open(self.aten_yaml_path, "w") as f: - f.write(TEST_YAML) - self.ops_yaml_path = os.path.join(self.temp_dir, "test.yaml") - self.tags_yaml_path = os.path.join(self.temp_dir, "tags.yaml") - with open(self.tags_yaml_path, "w") as f: - f.write( - """ -- tag: core - desc: test - """ - ) - with open(self.ops_yaml_path, "w") as f: - f.write( - """ -- op: add.out - device_check: NoCheck # TensorIterator - dispatch: - CPU: torch::executor::add_out_kernel - -- op: mul.out - device_check: NoCheck # TensorIterator - dispatch: - CPU: torch::executor::mul_out_kernel - """ - ) - - def test_translate_native_yaml_writes_correct_data(self) -> None: - out_yaml_path = os.path.join(self.temp_dir, "out.yaml") - with open(out_yaml_path, "w") as out_file: - translate_native_yaml( - tags_yaml_path=self.tags_yaml_path, - aten_yaml_path=self.aten_yaml_path, - native_yaml_path=self.ops_yaml_path, - use_aten_lib=False, - out_file=out_file, - ) - with open(out_yaml_path) as out_file: - es = yaml.load(out_file, Loader=LineLoader) - self.assertTrue(all("func" in e for e in es)) - self.assertTrue(all(e.get("variants") == "function" for e in es)) - - # Check that kernel fields aren't introduced in yaml - for e in es: - self.assertFalse({"kernels", "type_alias", "dim_order_alias"} < e.keys()) - - def test_parse_yaml_files(self) -> None: - custom_ops_yaml_path = None - selector = SelectiveBuilder.get_nop_selector() - use_aten_lib = False - - parsed_yaml, custom_ops_parsed_yaml = parse_yaml_files( - aten_yaml_path=self.aten_yaml_path, - tags_yaml_path=self.tags_yaml_path, - native_yaml_path=self.ops_yaml_path, - custom_ops_yaml_path=custom_ops_yaml_path, - selector=selector, - use_aten_lib=use_aten_lib, - ) - - # Just the default kernel entry - expected_kernel_entry = {"add.out": 1, "mul.out": 1} - self.assertTrue(len(parsed_yaml.native_functions) == len(expected_kernel_entry)) - - op_entries = parsed_yaml.kernel_index.index - for op_name, kernel_mapping in op_entries.items(): - self.assertTrue( - len(kernel_mapping) == expected_kernel_entry.pop(str(op_name)) - ) - - self.assertTrue(len(expected_kernel_entry) == 0) - - def tearDown(self) -> None: - import shutil - - try: - shutil.rmtree(self.temp_dir) - except OSError: - pass - - -class TestParseKernelYamlFiles(unittest.TestCase): - def setUp(self) -> None: - self.temp_dir = tempfile.mkdtemp() - - self.aten_kernel_yaml_path = os.path.join( - self.temp_dir, "test_kernel_native_functions.yaml" - ) - with open(self.aten_kernel_yaml_path, "w") as f: - f.write(TEST_KERNEL_YAML) - self.ops_yaml_path = os.path.join(self.temp_dir, "test.yaml") - self.tags_yaml_path = os.path.join(self.temp_dir, "tags.yaml") - with open(self.tags_yaml_path, "w") as f: - f.write( - """ -- tag: core - desc: test - """ - ) - with open(self.ops_yaml_path, "w") as f: - f.write( - """ -- op: add.out - 
device_check: NoCheck # TensorIterator - dispatch: - CPU: torch::executor::add_out_kernel - -- op: mul.out - device_check: NoCheck # TensorIterator - dispatch: - CPU: torch::executor::mul_out_kernel - """ - ) - - def test_translate_kernel_native_yaml_writes_correct_data(self) -> None: - out_yaml_path = os.path.join(self.temp_dir, "out2.yaml") - with open(out_yaml_path, "w") as out_file: - translate_native_yaml( - tags_yaml_path=self.tags_yaml_path, - aten_yaml_path=self.aten_kernel_yaml_path, - native_yaml_path=self.ops_yaml_path, - use_aten_lib=False, - out_file=out_file, - ) - with open(out_yaml_path) as out_file: - es = yaml.load(out_file, Loader=LineLoader) - self.assertTrue(all("func" in e for e in es)) - self.assertTrue(all(e.get("variants") == "function" for e in es)) - - # Check persistence of kernel fields in yaml - for e in es: - self.assertTrue({"kernels", "type_alias", "dim_order_alias"} < e.keys()) - - def test_parse_yaml_files(self) -> None: - custom_ops_yaml_path = None - selector = SelectiveBuilder.get_nop_selector() - use_aten_lib = False - - parsed_yaml, custom_ops_parsed_yaml = parse_yaml_files( - aten_yaml_path=self.aten_kernel_yaml_path, - tags_yaml_path=self.tags_yaml_path, - native_yaml_path=self.ops_yaml_path, - custom_ops_yaml_path=custom_ops_yaml_path, - selector=selector, - use_aten_lib=use_aten_lib, - ) - - expected_kernel_entry = {"add.out": 9, "mul.out": 2} - self.assertTrue(len(parsed_yaml.native_functions) == len(expected_kernel_entry)) - - op_entries = parsed_yaml.kernel_index.index - for op_name, kernel_mapping in op_entries.items(): - self.assertTrue( - len(kernel_mapping) == expected_kernel_entry.pop(str(op_name)) - ) - - self.assertTrue(len(expected_kernel_entry) == 0) - - def tearDown(self) -> None: - import shutil - - try: - shutil.rmtree(self.temp_dir) - except OSError: - pass - - -class TestGenFunctionsDeclarations(unittest.TestCase): - def setUp(self) -> None: - ( - self.custom_1_native_function, - custom_1_backend_index, - ) = NativeFunction.from_yaml( - {"func": "custom_1::op_1() -> bool", "dispatch": {"CPU": "kernel_1"}}, - loc=Location(__file__, 1), - valid_tags=set(), - ) - ( - self.custom_2_native_function, - custom_2_backend_index, - ) = NativeFunction.from_yaml( - { - "func": "custom_2::op_2() -> bool", - "dispatch": {"CPU": "kernel_2"}, - }, - loc=Location(__file__, 1), - valid_tags=set(), - ) - ( - self.custom_3_native_function, - custom_3_backend_index, - ) = NativeFunction.from_yaml( - { - "func": "custom_3::op_3(Tensor(a!) 
self, Tensor x) -> Tensor(a!)", - "dispatch": {"CPU": "kernel_3"}, - "variants": "method", - }, - loc=Location(__file__, 1), - valid_tags=set(), - ) - - backend_indices: dict[DispatchKey, dict[OperatorName, BackendMetadata]] = { - DispatchKey.CPU: {}, - DispatchKey.QuantizedCPU: {}, - } - BackendIndex.grow_index(backend_indices, custom_1_backend_index) - BackendIndex.grow_index(backend_indices, custom_2_backend_index) - self.static_dispatch_idx = [ - BackendIndex( - dispatch_key=k, - use_out_as_primary=True, - external=False, - device_guard=False, - index=backend_indices[k], - ) - for k in backend_indices - ] - self.kernel_index = ETKernelIndex.from_backend_indices(backend_indices) - - def test_operators_with_different_namespaces_are_grouped_correctly(self) -> None: - declarations = gen_functions_declarations( - native_functions=[ - self.custom_1_native_function, - self.custom_2_native_function, - ], - kernel_index=self.kernel_index, - selector=SelectiveBuilder.get_nop_selector(), - use_aten_lib=False, - ) - self.assertTrue( - """ -namespace custom_1 { - -// custom_1::op_1() -> bool -TORCH_API inline bool op_1(torch::executor::KernelRuntimeContext & context) { - return ::at::native::kernel_1(context); -} - -} // namespace custom_1 -""" - in declarations - ) - - self.assertTrue( - """ -namespace custom_2 { - -// custom_2::op_2() -> bool -TORCH_API inline bool op_2(torch::executor::KernelRuntimeContext & context) { - return ::at::native::kernel_2(context); -} - -} // namespace custom_2 - """ - in declarations - ) - - def test_aten_lib_has_context_arg(self) -> None: - declarations = gen_functions_declarations( - native_functions=[ - self.custom_1_native_function, - ], - kernel_index=self.kernel_index, - selector=SelectiveBuilder.get_nop_selector(), - use_aten_lib=True, - ) - self.assertTrue( - """ -namespace custom_1 { - -// custom_1::op_1() -> bool -TORCH_API inline bool op_1(torch::executor::KernelRuntimeContext & context) { - return at::op_1(); -} - -} // namespace custom_1 - """ - in declarations - ) - - def test_aten_lib_method_variant(self) -> None: - declarations = gen_functions_declarations( - native_functions=[ - self.custom_3_native_function, - ], - kernel_index=self.kernel_index, - selector=SelectiveBuilder.get_nop_selector(), - use_aten_lib=True, - ) - self.assertTrue( - """ -namespace custom_3 { - -// custom_3::op_3(Tensor(a!) self, Tensor x) -> Tensor(a!) 
-TORCH_API inline at::Tensor & op_3(torch::executor::KernelRuntimeContext & context, at::Tensor & self, const at::Tensor & x) { - return self.op_3(x); -} - -} // namespace custom_3 - """ - in declarations - ) - - -class TestComputeCodegenUnboxedKernels(unittest.TestCase): - def setUp(self) -> None: - ( - self.native_function_no_kern, - _, - ) = NativeFunction.from_yaml( - { - "func": "custom_1::op_1() -> bool", - "dispatch": {"CPU": "unused_kernel_1"}, - }, - loc=Location(__file__, 1), - valid_tags=set(), - ) - - self.default_kernel_key = ETKernelKey(default=True) - self.default_backend_metadata = BackendMetadata( - "default_kernel", False, "at::native" - ) - self.default_kernel_entry = ( - [self.default_kernel_key], - self.default_backend_metadata, - ) - - def test_codegen_unboxed_specialized(self) -> None: - specialized_kernel_key = ETKernelKey.gen_from_yaml( - {"self": ("T0", "D0"), "other": ("T0", "D0"), "out": ("T0", "D0")}, - {"T0": ["Double"]}, - {"D0": [0, 1, 2, 3]}, - ) - selector = SelectiveBuilder.from_yaml_dict( - { - "include_all_operators": True, - "et_kernel_metadata": { - "custom_1::op_1": ["v1/7;0,1,2,3|7;0,1,2,3|7;0,1,2,3"] - }, - } - ) - use_aten_lib = False - entry = ( - self.native_function_no_kern, - (specialized_kernel_key, self.default_backend_metadata), - ) - - result = ComputeCodegenUnboxedKernels( - selector, use_aten_lib, add_exception_boundary=False - )(entry) - # Concat used to prevent whitespace stripping - expected_str = ( - """ -Kernel( - "custom_1::op_1", - "v1/7;0,1,2,3|7;0,1,2,3|7;0,1,2,3", - [](torch::executor::KernelRuntimeContext & context, EValue** stack) { - """ - + """ - - - internal::EventTracerProfileOpScope event_tracer_op_scope(context.internal_event_tracer(), "native_call_op_1"); - EXECUTORCH_SCOPE_PROF("native_call_op_1"); - bool result_ = at::native::default_kernel(context, ); - internal::event_tracer_log_evalue(context.internal_event_tracer(), *stack[0]); - - *stack[0] = EValue(result_); - - } -), -""" - ) - - self.assertEqual(expected_str, result) - - def test_codegen_unboxed_specialized_not_matching(self) -> None: - specialized_kernel_key = ETKernelKey.gen_from_yaml( - {"self": ("T0", "D0"), "other": ("T0", "D0"), "out": ("T0", "D0")}, - {"T0": ["Double"]}, - {"D0": [0, 1, 2, 3]}, - ) - selector = SelectiveBuilder.from_yaml_dict( - { - "include_all_operators": True, - "et_kernel_metadata": { - "custom_1::op_1": ["v1/8;0,1,2,3|7;0,1,2,3|7;0,1,2,3"] - }, - } - ) - use_aten_lib = False - entry = ( - self.native_function_no_kern, - (specialized_kernel_key, self.default_backend_metadata), - ) - - self.assertRaises( - Exception, - ComputeCodegenUnboxedKernels( - selector, use_aten_lib, add_exception_boundary=False - ), - entry, - ) - - def test_codegen_unboxed_specialized_missing_root_op(self) -> None: - specialized_kernel_key = ETKernelKey.gen_from_yaml( - {"self": ("T0", "D0"), "other": ("T0", "D0"), "out": ("T0", "D0")}, - {"T0": ["Double"]}, - {"D0": [0, 1, 2, 3]}, - ) - selector = SelectiveBuilder.from_yaml_dict( - { - "et_kernel_metadata": { - "custom_1::op_1": ["v1/7;0,1,2,3|7;0,1,2,3|7;0,1,2,3"] - } - } - ) - use_aten_lib = False - entry = ( - self.native_function_no_kern, - (specialized_kernel_key, self.default_backend_metadata), - ) - - for add_exception_boundary in (True, False): - result = ComputeCodegenUnboxedKernels( - selector, use_aten_lib, add_exception_boundary - )(entry) - # Concat used to prevent whitespace stripping - expected_str = """""" - - self.assertEqual(expected_str, result) - - def test_codegen_unboxed_default(self) 
-> None: - """ - This test checks that if there is no specialized kernel, the default kernel is used. - """ - selector = SelectiveBuilder.from_yaml_dict( - { - "include_all_operators": True, - "et_kernel_metadata": { - "custom_1::op_1": ["v1/7;0,1,2,3|7;0,1,2,3|7;0,1,2,3"] - }, - } - ) - use_aten_lib = False - entry = (self.native_function_no_kern, self.default_kernel_entry) - - result = ComputeCodegenUnboxedKernels( - selector, use_aten_lib, add_exception_boundary=False - )(entry) - # Concat used to prevent whitespace stripping - expected_str = ( - """ -Kernel( - "custom_1::op_1", - [](torch::executor::KernelRuntimeContext & context, EValue** stack) { - """ - + """ - - - internal::EventTracerProfileOpScope event_tracer_op_scope(context.internal_event_tracer(), "native_call_op_1"); - EXECUTORCH_SCOPE_PROF("native_call_op_1"); - bool result_ = at::native::default_kernel(context, ); - internal::event_tracer_log_evalue(context.internal_event_tracer(), *stack[0]); - - *stack[0] = EValue(result_); - - } -), -""" - ) - - self.assertEqual(expected_str, result) - - result = ComputeCodegenUnboxedKernels( - selector, use_aten_lib, add_exception_boundary=True - )(entry) - # Concat used to prevent whitespace stripping - expected_str = ( - """ -Kernel( - "custom_1::op_1", - [](torch::executor::KernelRuntimeContext & context, EValue** stack) { - """ - + """ - - try { - internal::EventTracerProfileOpScope event_tracer_op_scope(context.internal_event_tracer(), "native_call_op_1"); - EXECUTORCH_SCOPE_PROF("native_call_op_1"); - bool result_ = at::native::default_kernel(context, ); - internal::event_tracer_log_evalue(context.internal_event_tracer(), *stack[0]); - - *stack[0] = EValue(result_); - } catch (const std::exception& ex) { - ET_LOG(Error, "Kernel threw an exception: %s", ex.what()); - context.fail(torch::executor::Error::Internal); - } - } -), -""" - ) - self.maxDiff = None - self.assertEqual(expected_str, result) - - def test_codegen_unboxed_default_kernel_key_selected(self) -> None: - """ - This test checks that if there is no specialized kernel, the default kernel is used, when the selector only has default key. 
- """ - selector = SelectiveBuilder.from_yaml_dict( - { - "include_all_operators": True, - "et_kernel_metadata": {"custom_1::op_1": ["default"]}, - } - ) - use_aten_lib = False - entry = (self.native_function_no_kern, self.default_kernel_entry) - - result = ComputeCodegenUnboxedKernels( - selector, use_aten_lib, add_exception_boundary=False - )(entry) - # Concat used to prevent whitespace stripping - expected_str = ( - """ -Kernel( - "custom_1::op_1", - [](torch::executor::KernelRuntimeContext & context, EValue** stack) { - """ - + """ - - - internal::EventTracerProfileOpScope event_tracer_op_scope(context.internal_event_tracer(), "native_call_op_1"); - EXECUTORCH_SCOPE_PROF("native_call_op_1"); - bool result_ = at::native::default_kernel(context, ); - internal::event_tracer_log_evalue(context.internal_event_tracer(), *stack[0]); - - *stack[0] = EValue(result_); - - } -), -""" - ) - - self.assertEqual(expected_str, result) diff --git a/tools/test/test_executorch_signatures.py b/tools/test/test_executorch_signatures.py deleted file mode 100644 index 79f291aba3d..00000000000 --- a/tools/test/test_executorch_signatures.py +++ /dev/null @@ -1,59 +0,0 @@ -import unittest - -from torchgen.executorch.api.types import ExecutorchCppSignature -from torchgen.local import parametrize -from torchgen.model import Location, NativeFunction - - -DEFAULT_NATIVE_FUNCTION, _ = NativeFunction.from_yaml( - {"func": "foo.out(Tensor input, *, Tensor(a!) out) -> Tensor(a!)"}, - loc=Location(__file__, 1), - valid_tags=set(), -) - - -class ExecutorchCppSignatureTest(unittest.TestCase): - def setUp(self) -> None: - self.sig = ExecutorchCppSignature.from_native_function(DEFAULT_NATIVE_FUNCTION) - - def test_runtime_signature_contains_runtime_context(self) -> None: - # test if `KernelRuntimeContext` argument exists in `RuntimeSignature` - with parametrize( - use_const_ref_for_mutable_tensors=False, use_ilistref_for_tensor_lists=False - ): - args = self.sig.arguments(include_context=True) - self.assertEqual(len(args), 3) - self.assertTrue(any(a.name == "context" for a in args)) - - def test_runtime_signature_does_not_contain_runtime_context(self) -> None: - # test if `KernelRuntimeContext` argument is missing in `RuntimeSignature` - with parametrize( - use_const_ref_for_mutable_tensors=False, use_ilistref_for_tensor_lists=False - ): - args = self.sig.arguments(include_context=False) - self.assertEqual(len(args), 2) - self.assertFalse(any(a.name == "context" for a in args)) - - def test_runtime_signature_declaration_correct(self) -> None: - with parametrize( - use_const_ref_for_mutable_tensors=False, use_ilistref_for_tensor_lists=False - ): - decl = self.sig.decl(include_context=True) - self.assertEqual( - decl, - ( - "torch::executor::Tensor & foo_outf(" - "torch::executor::KernelRuntimeContext & context, " - "const torch::executor::Tensor & input, " - "torch::executor::Tensor & out)" - ), - ) - no_context_decl = self.sig.decl(include_context=False) - self.assertEqual( - no_context_decl, - ( - "torch::executor::Tensor & foo_outf(" - "const torch::executor::Tensor & input, " - "torch::executor::Tensor & out)" - ), - ) diff --git a/tools/test/test_executorch_types.py b/tools/test/test_executorch_types.py deleted file mode 100644 index dedb19e21f3..00000000000 --- a/tools/test/test_executorch_types.py +++ /dev/null @@ -1,114 +0,0 @@ -import unittest - -from torchgen import local -from torchgen.api.types import ( - BaseCType, - boolT, - ConstRefCType, - CType, - longT, - MutRefCType, - NamedCType, - OptionalCType, - 
TupleCType, - VectorCType, - voidT, -) -from torchgen.executorch.api.et_cpp import argument_type, return_type, returns_type -from torchgen.executorch.api.types import ArrayRefCType, scalarT, tensorListT, tensorT -from torchgen.model import Argument, FunctionSchema, Return - - -class ExecutorchCppTest(unittest.TestCase): - """ - Test torchgen.executorch.api.cpp - """ - - def _test_argumenttype_type(self, arg_str: str, expected: NamedCType) -> None: - arg = Argument.parse(arg_str) - self.assertEqual(str(argument_type(arg, binds=arg.name)), str(expected)) - - @local.parametrize( - use_const_ref_for_mutable_tensors=False, use_ilistref_for_tensor_lists=False - ) - def test_argumenttype_type(self) -> None: - data = [ - ("Tensor self", NamedCType("self", ConstRefCType(BaseCType(tensorT)))), - ("Tensor(a!) out", NamedCType("out", MutRefCType(BaseCType(tensorT)))), - ( - "Tensor? opt", - NamedCType("opt", ConstRefCType(OptionalCType(BaseCType(tensorT)))), - ), - ("Scalar scalar", NamedCType("scalar", ConstRefCType(BaseCType(scalarT)))), - ( - "Scalar? scalar", - NamedCType("scalar", ConstRefCType(OptionalCType(BaseCType(scalarT)))), - ), - ("int[] size", NamedCType("size", ArrayRefCType(BaseCType(longT)))), - ("int? dim", NamedCType("dim", OptionalCType(BaseCType(longT)))), - ("Tensor[] weight", NamedCType("weight", BaseCType(tensorListT))), - ( - "Scalar[] spacing", - NamedCType("spacing", ArrayRefCType(ConstRefCType(BaseCType(scalarT)))), - ), - ( - "Tensor?[] weight", - NamedCType("weight", ArrayRefCType(OptionalCType(BaseCType(tensorT)))), - ), - ( - "SymInt[]? output_size", - NamedCType( - "output_size", OptionalCType(ArrayRefCType(BaseCType(longT))) - ), - ), - ( - "int[]? dims", - NamedCType("dims", OptionalCType(ArrayRefCType(BaseCType(longT)))), - ), - ( - "bool[3] output_mask", - NamedCType("output_mask", ArrayRefCType(BaseCType(boolT))), - ), - ] - for d in data: - self._test_argumenttype_type(*d) - - def _test_returntype_type(self, ret_str: str, expected: CType) -> None: - ret = Return.parse(ret_str) - self.assertEqual(str(return_type(ret)), str(expected)) - - @local.parametrize( - use_const_ref_for_mutable_tensors=False, use_ilistref_for_tensor_lists=False - ) - def test_returntype_type(self) -> None: - data = [ - ("Tensor", BaseCType(tensorT)), - ("Tensor(a!)", MutRefCType(BaseCType(tensorT))), - ("Tensor[]", VectorCType(BaseCType(tensorT))), - ] - for d in data: - self._test_returntype_type(*d) - - @local.parametrize( - use_const_ref_for_mutable_tensors=False, use_ilistref_for_tensor_lists=False - ) - def test_returns_type(self) -> None: - func = FunctionSchema.parse( - "min.dim(Tensor self, int dim, bool keepdim=False) -> (Tensor values, Tensor indices)" - ) - expected = TupleCType([BaseCType(tensorT), BaseCType(tensorT)]) - self.assertEqual(str(returns_type(func.returns)), str(expected)) - - @local.parametrize( - use_const_ref_for_mutable_tensors=False, use_ilistref_for_tensor_lists=False - ) - def test_void_return_type(self) -> None: - func = FunctionSchema.parse( - "_foreach_add_.Scalar(Tensor(a!)[] self, Scalar scalar) -> ()" - ) - expected = BaseCType(voidT) - self.assertEqual(str(returns_type(func.returns)), str(expected)) - - -if __name__ == "__main__": - unittest.main() diff --git a/tools/test/test_executorch_unboxing.py b/tools/test/test_executorch_unboxing.py deleted file mode 100644 index eff0145856d..00000000000 --- a/tools/test/test_executorch_unboxing.py +++ /dev/null @@ -1,176 +0,0 @@ -import unittest -from types import ModuleType - -from torchgen import local -from 
torchgen.api import cpp as aten_cpp, types as aten_types -from torchgen.api.types import ( - ArgName, - BaseCType, - ConstRefCType, - MutRefCType, - NamedCType, -) -from torchgen.executorch.api import et_cpp as et_cpp, types as et_types -from torchgen.executorch.api.unboxing import Unboxing -from torchgen.model import BaseTy, BaseType, ListType, OptionalType, Type - - -def aten_argumenttype_type_wrapper( - t: Type, *, mutable: bool, binds: ArgName, remove_non_owning_ref_types: bool = False -) -> NamedCType: - return aten_cpp.argumenttype_type( - t, - mutable=mutable, - binds=binds, - remove_non_owning_ref_types=remove_non_owning_ref_types, - ) - - -ATEN_UNBOXING = Unboxing(argument_type_gen=aten_argumenttype_type_wrapper) -ET_UNBOXING = Unboxing(argument_type_gen=et_cpp.argumenttype_type) - - -class TestUnboxing(unittest.TestCase): - """ - Could use torch.testing._internal.common_utils to reduce boilerplate. - GH CI job doesn't build torch before running tools unit tests, hence - manually adding these parametrized tests. - """ - - @local.parametrize( - use_const_ref_for_mutable_tensors=False, use_ilistref_for_tensor_lists=False - ) - def test_symint_argument_translate_ctype_aten(self) -> None: - # test if `SymInt[]` JIT argument can be translated into C++ argument correctly. - # should be `IntArrayRef` due to the fact that Executorch doesn't use symint sig. - - # pyre-fixme[16]: `enum.Enum` has no attribute `SymInt` - # pyre-fixme[19]: Call `BaseType.__init__` expects 0 positional arguments, 1 was provided. - symint_list_type = ListType(elem=BaseType(BaseTy.SymInt), size=None) - - out_name, ctype, _, _ = ATEN_UNBOXING.argumenttype_evalue_convert( - t=symint_list_type, arg_name="size", mutable=False - ) - - self.assertEqual(out_name, "size_list_out") - self.assertIsInstance(ctype, BaseCType) - # pyre-fixme[16]: - self.assertEqual(ctype, aten_types.BaseCType(aten_types.intArrayRefT)) - - @local.parametrize( - use_const_ref_for_mutable_tensors=False, use_ilistref_for_tensor_lists=False - ) - def test_symint_argument_translate_ctype_executorch(self) -> None: - # test if `SymInt[]` JIT argument can be translated into C++ argument correctly. - # should be `IntArrayRef` due to the fact that Executorch doesn't use symint sig. - - # pyre-fixme[16]: `enum.Enum` has no attribute `SymInt` - # pyre-fixme[19]: Call `BaseType.__init__` expects 0 positional arguments, 1 was provided. - symint_list_type = ListType(elem=BaseType(BaseTy.SymInt), size=None) - - out_name, ctype, _, _ = ET_UNBOXING.argumenttype_evalue_convert( - t=symint_list_type, arg_name="size", mutable=False - ) - - self.assertEqual(out_name, "size_list_out") - self.assertIsInstance(ctype, et_types.ArrayRefCType) - # pyre-fixme[16]: - self.assertEqual( - ctype, et_types.ArrayRefCType(elem=BaseCType(aten_types.longT)) - ) - - @local.parametrize( - use_const_ref_for_mutable_tensors=False, use_ilistref_for_tensor_lists=False - ) - def _test_const_tensor_argument_translate_ctype( - self, unboxing: Unboxing, types: ModuleType - ) -> None: - # pyre-fixme[16]: `enum.Enum` has no attribute `Tensor` - # pyre-fixme[19]: Call `BaseType.__init__` expects 0 positional arguments, 1 was provided. 
- tensor_type = BaseType(BaseTy.Tensor) - - out_name, ctype, _, _ = unboxing.argumenttype_evalue_convert( - t=tensor_type, arg_name="self", mutable=False - ) - - self.assertEqual(out_name, "self_base") - # pyre-fixme[16]: - self.assertEqual(ctype, ConstRefCType(BaseCType(types.tensorT))) - - def test_const_tensor_argument_translate_ctype_aten(self) -> None: - self._test_const_tensor_argument_translate_ctype(ATEN_UNBOXING, aten_types) - - def test_const_tensor_argument_translate_ctype_executorch(self) -> None: - self._test_const_tensor_argument_translate_ctype(ET_UNBOXING, et_types) - - @local.parametrize( - use_const_ref_for_mutable_tensors=False, use_ilistref_for_tensor_lists=False - ) - def _test_mutable_tensor_argument_translate_ctype( - self, unboxing: Unboxing, types: ModuleType - ) -> None: - # pyre-fixme[16]: `enum.Enum` has no attribute `Tensor` - # pyre-fixme[19]: Call `BaseType.__init__` expects 0 positional arguments, 1 was provided. - tensor_type = BaseType(BaseTy.Tensor) - - out_name, ctype, _, _ = unboxing.argumenttype_evalue_convert( - t=tensor_type, arg_name="out", mutable=True - ) - - self.assertEqual(out_name, "out_base") - # pyre-fixme[16]: - self.assertEqual(ctype, MutRefCType(BaseCType(types.tensorT))) - - def test_mutable_tensor_argument_translate_ctype_aten(self) -> None: - self._test_mutable_tensor_argument_translate_ctype(ATEN_UNBOXING, aten_types) - - def test_mutable_tensor_argument_translate_ctype_executorch(self) -> None: - self._test_mutable_tensor_argument_translate_ctype(ET_UNBOXING, et_types) - - @local.parametrize( - use_const_ref_for_mutable_tensors=False, use_ilistref_for_tensor_lists=False - ) - def _test_tensor_list_argument_translate_ctype( - self, unboxing: Unboxing, types: ModuleType - ) -> None: - # pyre-fixme[16]: `enum.Enum` has no attribute `Tensor` - # pyre-fixme[19]: Call `BaseType.__init__` expects 0 positional arguments, 1 was provided. - tensor_list_type = ListType(elem=BaseType(BaseTy.Tensor), size=None) - - out_name, ctype, _, _ = unboxing.argumenttype_evalue_convert( - t=tensor_list_type, arg_name="out", mutable=True - ) - - self.assertEqual(out_name, "out_list_out") - # pyre-fixme[16]: - self.assertEqual(ctype, BaseCType(types.tensorListT)) - - def test_tensor_list_argument_translate_ctype_aten(self) -> None: - self._test_tensor_list_argument_translate_ctype(ATEN_UNBOXING, aten_types) - - def test_tensor_list_argument_translate_ctype_executorch(self) -> None: - self._test_tensor_list_argument_translate_ctype(ET_UNBOXING, et_types) - - @local.parametrize( - use_const_ref_for_mutable_tensors=False, use_ilistref_for_tensor_lists=False - ) - def _test_optional_int_argument_translate_ctype( - self, unboxing: Unboxing, types: ModuleType - ) -> None: - # pyre-fixme[16]: `enum.Enum` has no attribute `Tensor` - # pyre-fixme[19]: Call `BaseType.__init__` expects 0 positional arguments, 1 was provided. 
- optional_int_type = OptionalType(elem=BaseType(BaseTy.int)) - - out_name, ctype, _, _ = unboxing.argumenttype_evalue_convert( - t=optional_int_type, arg_name="something", mutable=True - ) - - self.assertEqual(out_name, "something_opt_out") - # pyre-fixme[16]: - self.assertEqual(ctype, types.OptionalCType(BaseCType(types.longT))) - - def test_optional_int_argument_translate_ctype_aten(self) -> None: - self._test_optional_int_argument_translate_ctype(ATEN_UNBOXING, aten_types) - - def test_optional_int_argument_translate_ctype_executorch(self) -> None: - self._test_optional_int_argument_translate_ctype(ET_UNBOXING, et_types) diff --git a/tools/test/test_selective_build.py b/tools/test/test_selective_build.py index 59e6e617072..fac6ca6c8b5 100644 --- a/tools/test/test_selective_build.py +++ b/tools/test/test_selective_build.py @@ -298,45 +298,3 @@ operators: valid_tags=set(), ) self.assertTrue(selector.is_native_function_selected(native_function)) - - -class TestExecuTorchSelectiveBuild(unittest.TestCase): - def test_et_kernel_selected(self) -> None: - yaml_config = """ -et_kernel_metadata: - aten::add.out: - - "v1/6;0,1|6;0,1|6;0,1|6;0,1" - aten::sub.out: - - "v1/6;0,1|6;0,1|6;0,1|6;0,1" -""" - selector = SelectiveBuilder.from_yaml_str(yaml_config) - self.assertListEqual( - ["v1/6;0,1|6;0,1|6;0,1|6;0,1"], - selector.et_get_selected_kernels( - "aten::add.out", - [ - "v1/6;0,1|6;0,1|6;0,1|6;0,1", - "v1/3;0,1|3;0,1|3;0,1|3;0,1", - "v1/6;1,0|6;0,1|6;0,1|6;0,1", - ], - ), - ) - self.assertListEqual( - ["v1/6;0,1|6;0,1|6;0,1|6;0,1"], - selector.et_get_selected_kernels( - "aten::sub.out", ["v1/6;0,1|6;0,1|6;0,1|6;0,1"] - ), - ) - self.assertListEqual( - [], - selector.et_get_selected_kernels( - "aten::mul.out", ["v1/6;0,1|6;0,1|6;0,1|6;0,1"] - ), - ) - # We don't use version for now. - self.assertListEqual( - ["v2/6;0,1|6;0,1|6;0,1|6;0,1"], - selector.et_get_selected_kernels( - "aten::add.out", ["v2/6;0,1|6;0,1|6;0,1|6;0,1"] - ), - ) diff --git a/torchgen/build.bzl b/torchgen/build.bzl index 2ec68955df9..50765869f8d 100644 --- a/torchgen/build.bzl +++ b/torchgen/build.bzl @@ -18,13 +18,3 @@ def define_targets(rules): rules.requirement("typing-extensions"), ], ) - - rules.py_binary( - name = "gen_executorch", - srcs = [":torchgen"], - visibility = ["//visibility:public"], - deps = [ - rules.requirement("PyYAML"), - rules.requirement("typing-extensions"), - ], - ) diff --git a/torchgen/executorch/__init__.py b/torchgen/executorch/__init__.py deleted file mode 100644 index e69de29bb2d..00000000000 diff --git a/torchgen/executorch/api/__init__.py b/torchgen/executorch/api/__init__.py deleted file mode 100644 index e69de29bb2d..00000000000 diff --git a/torchgen/executorch/api/custom_ops.py b/torchgen/executorch/api/custom_ops.py deleted file mode 100644 index 641b7e9c941..00000000000 --- a/torchgen/executorch/api/custom_ops.py +++ /dev/null @@ -1,151 +0,0 @@ -from __future__ import annotations - -from collections import defaultdict -from dataclasses import dataclass -from typing import TYPE_CHECKING - -from torchgen import dest - - -# disable import sorting to avoid circular dependency. 
-from torchgen.api.types import DispatcherSignature # usort: skip -from torchgen.context import method_with_native_function -from torchgen.model import BaseTy, BaseType, DispatchKey, NativeFunction, Variant -from torchgen.utils import concatMap, Target - - -if TYPE_CHECKING: - from collections.abc import Sequence - - from torchgen.executorch.model import ETKernelIndex - from torchgen.selective_build.selector import SelectiveBuilder - - -# Generates RegisterKernelStub.cpp, which provides placeholder kernels for custom operators. This will be used at -# model authoring side. -@dataclass(frozen=True) -class ComputeNativeFunctionStub: - @method_with_native_function - def __call__(self, f: NativeFunction) -> str | None: - if Variant.function not in f.variants: - return None - - sig = DispatcherSignature.from_schema( - f.func, prefix=f"wrapper_CPU_{f.func.name.overload_name}_", symint=False - ) - assert sig is not None - if len(f.func.returns) == 0: - ret_name = "" - elif len(f.func.returns) == 1: - if f.func.arguments.out: - ret_name = f.func.arguments.out[0].name - else: - ret_name = next( - ( - a.name - for a in f.func.arguments.flat_non_out - if a.type == f.func.returns[0].type - ), - "", - ) - if not ret_name: - # if return type is tensor - if f.func.returns[0].type == BaseType(BaseTy.Tensor): - # Returns an empty tensor - ret_name = "at::Tensor()" - else: - raise Exception( # noqa: TRY002 - f"Can't handle this return type {f.func}" - ) # noqa: TRY002 - elif len(f.func.arguments.out) == len(f.func.returns): - # Returns a tuple of out arguments - tensor_type = "at::Tensor &" - comma = ", " - ret_name = f"""::std::tuple<{comma.join([tensor_type] * len(f.func.returns))}>( - {comma.join([r.name for r in f.func.arguments.out])} - )""" - else: - assert all(a.type == BaseType(BaseTy.Tensor) for a in f.func.returns), ( - f"Only support tensor returns but got {f.func.returns}" - ) - # Returns a tuple of empty tensors - tensor_type = "at::Tensor" - comma = ", " - ret_name = f"""::std::tuple<{comma.join([tensor_type] * len(f.func.returns))}>( - {comma.join(["at::Tensor()" for _ in f.func.returns])} - )""" - ret_str = f"return {ret_name};" if len(f.func.returns) > 0 else "" - return f""" -{sig.defn()} {{ - {ret_str} -}} - """ - - -def gen_custom_ops_registration( - *, - native_functions: Sequence[NativeFunction], - selector: SelectiveBuilder, - kernel_index: ETKernelIndex, - rocm: bool, -) -> tuple[str, str]: - """ - Generate custom ops registration code for dest.RegisterDispatchKey. - - :param native_functions: a sequence of `NativeFunction` - :param selector: for selective build. - :param kernel_index: kernels for all the ops. - :param rocm: bool for dest.RegisterDispatchKey. - :return: generated C++ code to register custom operators into PyTorch - """ - - # convert kernel index to BackendIndex. This is because we can't handle ETKernelIndex yet. - # TODO larryliu: evaluate if this code is still needed. If yes let it handle ETKernelIndex. 
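    # Rough illustration of the second returned string (the static-init registrations) for a
    # hypothetical custom namespace; "custom_1", "op_1" and the wrapper name are made-up
    # examples, not taken from this file:
    #
    #   TORCH_LIBRARY_IMPL(custom_1, CPU, m) {
    #     m.impl("op_1", TORCH_FN(wrapper_CPU__op_1));
    #   }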
- - dispatch_key = DispatchKey.CPU - backend_index = kernel_index._to_backend_index() - static_init_dispatch_registrations = "" - ns_grouped_native_functions: dict[str, list[NativeFunction]] = defaultdict(list) - for native_function in native_functions: - ns_grouped_native_functions[native_function.namespace].append(native_function) - - for namespace, functions in ns_grouped_native_functions.items(): - if len(functions) == 0: - continue - dispatch_registrations_body = "\n".join( - list( - concatMap( - dest.RegisterDispatchKey( - backend_index, - Target.REGISTRATION, - selector, - rocm=rocm, - symint=False, - class_method_name=None, - skip_dispatcher_op_registration=False, - ), - functions, - ) - ) - ) - static_init_dispatch_registrations += f""" -TORCH_LIBRARY_IMPL({namespace}, {dispatch_key}, m) {{ -{dispatch_registrations_body} -}}""" - anonymous_definition = "\n".join( - list( - concatMap( - dest.RegisterDispatchKey( - backend_index, - Target.ANONYMOUS_DEFINITION, - selector, - rocm=rocm, - symint=False, - class_method_name=None, - skip_dispatcher_op_registration=False, - ), - native_functions, - ) - ) - ) - return anonymous_definition, static_init_dispatch_registrations diff --git a/torchgen/executorch/api/et_cpp.py b/torchgen/executorch/api/et_cpp.py deleted file mode 100644 index 081a3d4ece1..00000000000 --- a/torchgen/executorch/api/et_cpp.py +++ /dev/null @@ -1,367 +0,0 @@ -from __future__ import annotations - -from typing import TYPE_CHECKING -from typing_extensions import assert_never - -from torchgen import local -from torchgen.api.types import ( - ArgName, - BaseCType, - Binding, - ConstRefCType, - CType, - MutRefCType, - NamedCType, - SpecialArgName, - TupleCType, - VectorCType, - voidT, -) -from torchgen.executorch.api.types import ( - ArrayRefCType, - BaseTypeToCppMapping, - OptionalCType, - scalarT, - tensorListT, - tensorT, -) -from torchgen.model import ( - Argument, - Arguments, - BaseTy, - BaseType, - ListType, - NativeFunction, - OptionalType, - Return, - SelfArgument, - TensorOptionsArguments, - Type, -) - - -if TYPE_CHECKING: - from collections.abc import Sequence - - -""" -This file describes the translation of JIT schema to the public C++ API, which is what people use when they call -functions like at::add. It also serves as a native function API, which is the signature of kernels, -since in Executorch CppSignature is the same as NativeSignature. - -Difference between this file and torchgen.api.cpp.py: - - - Executorch doesn't support TensorOptions, however in this file we still keep the logic here to be compatible with - torchgen.api.cpp, so that we can do stuff like ATen mode (running ATen kernels in Executorch). - - - Executorch doesn't support Dimname. - - - Executorch runtime doesn't support SymInt, will treat it as int. -""" - - -# Translation of "value types" in JIT schema to C++ API type. Value -# types look the same no matter if they are argument types or return -# types. Returns None if the type in question is not a value type. -def valuetype_type( - t: Type, - *, - binds: ArgName, -) -> NamedCType | None: - if isinstance(t, BaseType): - if t.name == BaseTy.Tensor or t.name == BaseTy.Scalar: - return None - # For SymInt we simply treat it as int. - elif str(t) == "SymInt": - return NamedCType(binds, BaseCType(BaseTypeToCppMapping[BaseTy.int])) - # All other BaseType currently map directly to BaseCppTypes. 
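            # e.g. int -> int64_t (longT), float -> double, bool -> bool,
            # str -> torch::executor::string_view, ScalarType -> torch::executor::ScalarType
            # (per BaseTypeToCppMapping in torchgen/executorch/api/types/types.py below).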
- return NamedCType(binds, BaseCType(BaseTypeToCppMapping[t.name])) - elif isinstance(t, OptionalType): - elem = valuetype_type(t.elem, binds=binds) - if elem is None: - return None - return NamedCType(binds, OptionalCType(elem.type)) - elif isinstance(t, ListType): - if str(t.elem) == "bool": - assert t.size is not None - return NamedCType( - binds, ArrayRefCType(BaseCType(BaseTypeToCppMapping[BaseTy.bool])) - ) - else: - return None - else: - raise AssertionError(f"unrecognized type {repr(t)}") - - -# Translation of types occurring in JIT arguments to a C++ argument type. -# If remove_non_owning_ref_types is set, we'll guarantee that the outputed CType is not a non-owning reference type. -# For example, we'll return std::vector instead of IntArrayRef. -# See Note [translation from C++ reference to value types] -def argumenttype_type( - t: Type, - *, - mutable: bool, - binds: ArgName, - remove_non_owning_ref_types: bool = False, -) -> NamedCType: - # If it's a value type, do the value type translation - r = valuetype_type( - t, - binds=binds, - ) - if r is not None: - return r - if isinstance(t, BaseType): - if t.name == BaseTy.Tensor: - if mutable and not local.use_const_ref_for_mutable_tensors(): - return NamedCType(binds, MutRefCType(BaseCType(tensorT))) - else: - return NamedCType(binds, ConstRefCType(BaseCType(tensorT))) - elif t.name == BaseTy.Scalar: - return NamedCType(binds, ConstRefCType(BaseCType(scalarT))) - else: - raise AssertionError(f"base type should have been value type {t}") - elif isinstance(t, OptionalType): - if str(t.elem) == "Tensor": - if mutable and not local.use_const_ref_for_mutable_tensors(): - return NamedCType( - binds, MutRefCType(BaseCType(tensorT)) - ) # TODO: fix this discrepancy - else: - return NamedCType( - binds, ConstRefCType(OptionalCType(BaseCType(tensorT))) - ) - elif str(t.elem) == "Scalar": - return NamedCType(binds, ConstRefCType(OptionalCType(BaseCType(scalarT)))) - elem = argumenttype_type(t.elem, mutable=mutable, binds=binds) - return NamedCType(binds, OptionalCType(elem.type)) - elif isinstance(t, ListType): - # TODO: keeping these special cases for Tensor[] and Tensor?[] so that we can hookup with ATen kernels. - if str(t.elem) == "Tensor": - return NamedCType(binds, BaseCType(tensorListT)) - elif str(t.elem) == "Dimname": - raise NotImplementedError("Executorch doesn't support Dimname") - elif str(t.elem) == "Tensor?": - return NamedCType(binds, ArrayRefCType(OptionalCType(BaseCType(tensorT)))) - elem = argumenttype_type(t.elem, mutable=mutable, binds=binds) - return NamedCType(binds, ArrayRefCType(elem.type)) - else: - raise AssertionError(f"unrecognized type {repr(t)}") - - -# Translate a JIT argument into its C++ type -def argument_type(a: Argument, *, binds: ArgName) -> NamedCType: - return argumenttype_type(a.type, mutable=a.is_write, binds=binds) - - -# Translation of a (non-multi) return type from JIT to C++ -# N.B: returntype_type returns a CType, not a NamedCType. -# This is mostly because of the mismatch between return types and return names. -# e.g. a function with a return type of 'void' has 0 return names, -# and a function with a return type of 'std::tuple' has >1 return name. 
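# For example, a "Tensor" return maps to torch::executor::Tensor, "Tensor(a!)" to
# torch::executor::Tensor & (or a const ref when use_const_ref_for_mutable_tensors is set),
# and "Tensor[]" to a vector of Tensor, matching tools/test/test_executorch_types.py above.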
-def returntype_type(t: Type, *, mutable: bool) -> CType: - # placeholder is ignored - r = valuetype_type(t, binds="__placeholder__") - if r is not None: - return r.type - - if isinstance(t, BaseType): - if t.name == BaseTy.Tensor: - if mutable: - if local.use_const_ref_for_mutable_tensors(): - return ConstRefCType(BaseCType(tensorT)) - else: - return MutRefCType(BaseCType(tensorT)) - else: - # Note [Tensor Copy Returns] - # Currently, we use "Argument.is_write" to determine - # whether or not Tensor return types should be copies or references. - # If that ever changes, take a look at other locations of this note! - return BaseCType(tensorT) - elif t.name == BaseTy.Scalar: - return BaseCType(scalarT) - elif isinstance(t, ListType): - assert not mutable, ( - "Native functions should never return a mutable tensor list. They should return void." - ) - elem = returntype_type(t.elem, mutable=False) - assert t.size is None, f"fixed size list returns not supported: {t}" - return VectorCType(elem) - - raise AssertionError(f"unrecognized return type {t}") - - -# Translation of a single return to its C++ type -def return_type(r: Return) -> CType: - return returntype_type(r.type, mutable=r.is_write) - - -# Translation of a full (possibly multi) return from JIT to its C++ type -def returns_type(rs: Sequence[Return]) -> CType: - if len(rs) == 0: - return BaseCType(voidT) - elif len(rs) == 1: - return return_type(rs[0]) - else: - return TupleCType([return_type(r) for r in rs]) - - -def return_names(f: NativeFunction, *, fallback_name: str = "result") -> Sequence[str]: - returns: list[str] = [] - for i, r in enumerate(f.func.returns): - # If we have an inplace function, the return argument is - # implicitly named self. - # TODO: Consider incorporating this into the data model - if f.func.name.name.inplace: - assert i == 0, "illegal inplace function with multiple returns" - name = "self" - # If we are out function, the name is the name of the - # corresponding output function (r.name will get recorded - # in field_name later.) - elif f.func.is_out_fn(): - name = f.func.arguments.out[i].name - # If the return argument is explicitly named... 
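        # (e.g. "min.dim(...) -> (Tensor values, Tensor indices)" yields "values" and
        # "indices"; a name that collides with an argument name gets a "_return" suffix below)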
- elif r.name: - name_conflict = any( - r.name == a.name for a in f.func.schema_order_arguments() - ) - if name_conflict and not f.func.is_out_fn(): - name = f"{r.name}_return" - else: - name = r.name - # If there is no explicit name and no fallback name was passed in, we just name the output result, - # unless it's a multi-return, in which case it's result0, - # result1, etc (zero-indexed) - else: - name = fallback_name if len(f.func.returns) == 1 else f"{fallback_name}{i}" - returns.append(name) - return returns - - -JIT_TO_CPP_DEFAULT = { - "False": "false", - "True": "true", - "None": "torch::execustd::nullopt", # UGH this one is type directed - "[]": "{}", - "contiguous_format": "torch::executorch::MemoryFormat::Contiguous", - "long": "torch::executorch::kLong", -} - - -# Convert a JIT default into C++ expression representing the default -def default_expr(d: str, t: Type) -> str: - if d == "None" and str(t) == "Tensor?": - return "{}" - if isinstance(t, BaseType) and t.name is BaseTy.str: - # Schema allows single quotes but C++ needs double - if len(d) >= 2 and d[0] == "'" and d[-1] == "'": - s = "" - i = 1 - while i + 1 < len(d): - if d[i] != "\\": - if d[i] == '"': - s += '\\"' - else: - s += d[i] - i += 1 - else: - if d[i + 1] == "'": - s += "'" - else: - s += d[i : i + 2] - i += 2 - - return f'"{s}"' - - if isinstance(t, OptionalType): - if d == "None": - return "torch::executor::nullopt" - - return default_expr(d, t.elem) - - if isinstance(t, ListType): - if d.startswith("[") and d.endswith("]"): - return "{" + d[1:-1] + "}" - elif t.size is None: - # NOTE: Sized lists can have scalar defaults - raise ValueError(f"Expected a list default '[...]' but found: '{d}'") - - return JIT_TO_CPP_DEFAULT.get(d, d) - - -# Convert an argument into its C++ API form - - -def argument( - a: Argument | TensorOptionsArguments | SelfArgument, - *, - cpp_no_default_args: set[str], - method: bool, - faithful: bool, - has_tensor_options: bool, -) -> list[Binding]: - def sub_argument( - a: Argument | TensorOptionsArguments | SelfArgument, - ) -> list[Binding]: - return argument( - a, - cpp_no_default_args=cpp_no_default_args, - method=method, - faithful=faithful, - has_tensor_options=has_tensor_options, - ) - - if isinstance(a, Argument): - binds: ArgName - if a.name == "memory_format" and has_tensor_options: - binds = SpecialArgName.possibly_redundant_memory_format - else: - binds = a.name - default: str | None = None - if a.name not in cpp_no_default_args and a.default is not None: - default = default_expr(a.default, a.type) - return [ - Binding( - nctype=argument_type(a, binds=binds), - name=a.name, - default=default, - argument=a, - ) - ] - elif isinstance(a, TensorOptionsArguments): - raise NotImplementedError("Need to implement type resolution for TensorOptions") - elif isinstance(a, SelfArgument): - if method: - # Caller is responsible for installing implicit this in context! 
- return [] - else: - return sub_argument(a.argument) - else: - assert_never(a) - - -def arguments( - arguments: Arguments, - *, - faithful: bool, - method: bool, - cpp_no_default_args: set[str], -) -> list[Binding]: - args: list[Argument | TensorOptionsArguments | SelfArgument] = [] - if faithful: - args.extend(arguments.non_out) - args.extend(arguments.out) - else: - args.extend(arguments.out) - args.extend(arguments.non_out) - return [ - r.no_default() if faithful else r - for a in args - for r in argument( - a, - faithful=faithful, - method=method, - has_tensor_options=arguments.tensor_options is not None, - cpp_no_default_args=cpp_no_default_args, - ) - ] diff --git a/torchgen/executorch/api/types/__init__.py b/torchgen/executorch/api/types/__init__.py deleted file mode 100644 index 08cb168df73..00000000000 --- a/torchgen/executorch/api/types/__init__.py +++ /dev/null @@ -1,4 +0,0 @@ -from torchgen.executorch.api.types.types import * - - -from torchgen.executorch.api.types.signatures import * # usort: skip diff --git a/torchgen/executorch/api/types/signatures.py b/torchgen/executorch/api/types/signatures.py deleted file mode 100644 index ac3477cede6..00000000000 --- a/torchgen/executorch/api/types/signatures.py +++ /dev/null @@ -1,76 +0,0 @@ -from __future__ import annotations - -from dataclasses import dataclass -from typing import TYPE_CHECKING - -import torchgen.api.cpp as aten_cpp -from torchgen.executorch.api.types.types import contextArg - - -if TYPE_CHECKING: - from torchgen.api.types import Binding, CType - from torchgen.model import FunctionSchema, NativeFunction - - -@dataclass(frozen=True) -class ExecutorchCppSignature: - """ - This signature is merely a CppSignature with Executorch types (optionally - contains KernelRuntimeContext as well). The inline definition of - CppSignature is generated in Functions.h and it's used by unboxing - functions. - """ - - # The schema this signature is derived from - func: FunctionSchema - - # The set of C++ arguments which should not have defaults applied to them - cpp_no_default_args: set[str] - - # Allows you to prepend an arbitrary prefix to the signature name. - # This is useful for parts of the codegen that generate wrappers around kernels, - # and need to avoid naming collisions. 
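    # For "foo.out(Tensor input, *, Tensor(a!) out) -> Tensor(a!)", decl() roughly produces:
    #   torch::executor::Tensor & foo_outf(torch::executor::KernelRuntimeContext & context,
    #       const torch::executor::Tensor & input, torch::executor::Tensor & out)
    # (see tools/test/test_executorch_signatures.py above for the exact expected string).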
- prefix: str = "" - - def arguments(self, *, include_context: bool = True) -> list[Binding]: - return ([contextArg] if include_context else []) + et_cpp.arguments( - self.func.arguments, - faithful=True, # always faithful, out argument at the end - method=False, # method not supported - cpp_no_default_args=self.cpp_no_default_args, - ) - - def name(self) -> str: - return self.prefix + aten_cpp.name( - self.func, - faithful_name_for_out_overloads=True, - ) - - def decl(self, name: str | None = None, *, include_context: bool = True) -> str: - args_str = ", ".join( - a.decl() for a in self.arguments(include_context=include_context) - ) - if name is None: - name = self.name() - return f"{self.returns_type().cpp_type()} {name}({args_str})" - - def defn(self, name: str | None = None) -> str: - args = [a.defn() for a in self.arguments()] - args_str = ", ".join(args) - if name is None: - name = self.name() - return f"{self.returns_type().cpp_type()} {name}({args_str})" - - def returns_type(self) -> CType: - return et_cpp.returns_type(self.func.returns) - - @staticmethod - def from_native_function( - f: NativeFunction, *, prefix: str = "" - ) -> ExecutorchCppSignature: - return ExecutorchCppSignature( - func=f.func, prefix=prefix, cpp_no_default_args=f.cpp_no_default_args - ) - - -from torchgen.executorch.api import et_cpp diff --git a/torchgen/executorch/api/types/types.py b/torchgen/executorch/api/types/types.py deleted file mode 100644 index 712d7e5e341..00000000000 --- a/torchgen/executorch/api/types/types.py +++ /dev/null @@ -1,77 +0,0 @@ -from __future__ import annotations - -from dataclasses import dataclass - -from torchgen.api.types import ( - BaseCppType, - BaseCType, - Binding, - boolT, - CType, - doubleT, - Expr, - longT, - MutRefCType, - NamedCType, -) -from torchgen.model import BaseTy - - -halfT = BaseCppType("torch::executor", "Half") -bfloat16T = BaseCppType("torch::executor", "BFloat16") -stringT = BaseCppType("torch::executor", "string_view") -scalarTypeT = BaseCppType("torch::executor", "ScalarType") -tensorT = BaseCppType("torch::executor", "Tensor") -tensorListT = BaseCppType("torch::executor", "TensorList") -scalarT = BaseCppType("torch::executor", "Scalar") -memoryFormatT = BaseCppType("torch::executor", "MemoryFormat") -intArrayRefT = BaseCppType("torch::executor", "IntArrayRef") -optionalT = BaseCppType("torch::executor", "optional") -contextT = BaseCppType("torch::executor", "KernelRuntimeContext") - -contextExpr = Expr( - expr="context", - type=NamedCType(name="context", type=MutRefCType(BaseCType(contextT))), -) - -contextArg = Binding( - name="context", - nctype=contextExpr.type, - argument=None, # type: ignore[arg-type] - default=None, -) - -BaseTypeToCppMapping: dict[BaseTy, BaseCppType] = { - BaseTy.int: longT, - BaseTy.float: doubleT, - BaseTy.bool: boolT, - BaseTy.str: stringT, - BaseTy.ScalarType: scalarTypeT, - BaseTy.Tensor: tensorT, - BaseTy.Scalar: scalarT, - BaseTy.MemoryFormat: memoryFormatT, -} - - -@dataclass(frozen=True) -class OptionalCType(CType): - elem: CType - - def cpp_type(self, *, strip_ref: bool = False) -> str: - # Do not pass `strip_ref` recursively. - return f"torch::executor::optional<{self.elem.cpp_type()}>" - - def remove_const_ref(self) -> CType: - return OptionalCType(self.elem.remove_const_ref()) - - -@dataclass(frozen=True) -class ArrayRefCType(CType): - elem: CType - - def cpp_type(self, *, strip_ref: bool = False) -> str: - # Do not pass `strip_ref` recursively. 
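        # e.g. ArrayRefCType(BaseCType(longT)).cpp_type() == "torch::executor::ArrayRef<int64_t>"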
- return f"torch::executor::ArrayRef<{self.elem.cpp_type()}>" - - def remove_const_ref(self) -> CType: - return ArrayRefCType(self.elem.remove_const_ref()) diff --git a/torchgen/executorch/api/unboxing.py b/torchgen/executorch/api/unboxing.py deleted file mode 100644 index 6d648f71511..00000000000 --- a/torchgen/executorch/api/unboxing.py +++ /dev/null @@ -1,218 +0,0 @@ -from __future__ import annotations - -from dataclasses import dataclass -from typing import Callable, TYPE_CHECKING - -from torchgen.model import ( - Argument, - BaseTy, - BaseType, - ListType, - NativeFunction, - OptionalType, - Type, -) - - -if TYPE_CHECKING: - from collections.abc import Sequence - - from torchgen.api.types import Binding, CType, NamedCType - - -connector = "\n\t" - - -# Return unboxing function name for a NativeFunction -def name(f: NativeFunction) -> str: - return f.func.name.unambiguous_name() - - -@dataclass(frozen=True) -class Unboxing: - """ - Takes a sequence of Bindings and unbox EValues to these Bindings. Return generated code that performs correct unboxing. - A sample generated code: - // aten::mul.out(Tensor self, Tensor other, *, Tensor(a!) out) -> Tensor(a!) - void mul_out(EValue** stack) { - EValue& self = *stack[0]; - EValue& other = *stack[1]; - EValue& out = *stack[2]; - const torch::executor::Tensor & self_base = self.to(); - const torch::executor::Tensor & other_base = other.to(); - torch::executor::Tensor & out_base = out.to(); - - EXECUTORCH_SCOPE_PROF("native_call_mul.out"); - torch::executor::mul_outf(self_base, other_base, out_base); - - - } - """ - - # this is a callable that converts a JIT argument, into its C++ type. - # Translates (type, mutability, binds) to NamedCType. E.g., torchgen.api.cpp.argumenttype_type. - argument_type_gen: Callable[ - ..., - NamedCType, - ] - - # Convert all the arguments in a NativeFunction to C++ code - def convert_arguments( - self, args: Sequence[Binding] - ) -> tuple[list[Binding], list[str]]: - code_list = [f"EValue& {args[i].name} = *stack[{i}];" for i in range(len(args))] - binding_list = [] - for arg in args: - # expecting only Argument - if not isinstance(arg.argument, Argument): - raise Exception( # noqa: TRY002 - f"Unexpected argument type, expecting `Argument` but got {arg}" - ) - argument: Argument = arg.argument - unboxed_name, _, code, decl = self.argumenttype_evalue_convert( - argument.type, argument.name, mutable=argument.is_write - ) - code_list.extend(decl) - code_list.extend(code) - binding_list.append(arg.with_name(unboxed_name)) - return binding_list, code_list - - def argumenttype_evalue_convert( - self, t: Type, arg_name: str, *, mutable: bool = False - ) -> tuple[str, CType, list[str], list[str]]: - """ - Takes in the type, name and mutability corresponding to an argument, and generates a tuple of: - (1) the C++ code necessary to unbox the argument - (2) A Binding corresponding to the newly created unboxed variable, including variable name and its CType - :param t: a `Type` of an argument - :param arg_name: argument name - :param mutable: boolean for whether this argument type is mutable - :return: unboxed result - """ - ctype = self.argument_type_gen(t, mutable=mutable, binds=arg_name).type - - if isinstance(t, BaseType): - out_name = f"{arg_name}_base" - code, decl = self._gen_code_base_type( - arg_name=arg_name, out_name=out_name, ctype=ctype - ) - elif isinstance(t, OptionalType): - out_name = f"{arg_name}_opt_out" - code, decl = self._gen_code_optional_type( - arg_name=arg_name, out_name=out_name, t=t, ctype=ctype - ) 
- elif isinstance(t, ListType): - out_name = f"{arg_name}_list_out" - code, decl = self._gen_code_list_type( - arg_name=arg_name, out_name=out_name, t=t, ctype=ctype - ) - else: - raise Exception( # noqa: TRY002 - f"Cannot handle type {t}. arg_name: {arg_name}" - ) # noqa: TRY002 - return out_name, ctype, code, decl - - def _gen_code_base_type( - self, arg_name: str, out_name: str, ctype: CType - ) -> tuple[list[str], list[str]]: - return [ - f"{ctype.cpp_type()} {out_name} = {arg_name}.to<{ctype.cpp_type(strip_ref=True)}>();" - ], [] - - def _gen_code_optional_type( - self, arg_name: str, out_name: str, t: OptionalType, ctype: CType - ) -> tuple[list[str], list[str]]: - in_name = f"{arg_name}_opt_in" - res_name, base_type, res_code, decl = self.argumenttype_evalue_convert( - t.elem, in_name - ) - return ( - f""" - auto {out_name} = {arg_name}.toOptional<{base_type.cpp_type(strip_ref=True)}>(); - """.split("\n"), - decl, - ) - - def _gen_code_list_type( - self, arg_name: str, out_name: str, t: ListType, ctype: CType - ) -> tuple[list[str], list[str]]: - in_name = f"{arg_name}_list_in" - elem_name = f"{arg_name}_elem" - code = [] - res_name, res_ctype, res_code, decl = self.argumenttype_evalue_convert( - t.elem, elem_name - ) - - if isinstance(t.elem, BaseType) and t.elem.name == BaseTy.Tensor: - code.extend( - f""" - auto {out_name} = {arg_name}.toTensorList(); - """.split("\n") - ) - elif isinstance(t.elem, BaseType) and ( - t.elem.name == BaseTy.int or t.elem.name == BaseTy.SymInt - ): - code.extend( - f""" - auto {out_name} = {arg_name}.toIntList(); - """.split("\n") - ) - elif isinstance(t.elem, BaseType) and t.elem.name == BaseTy.float: - code.extend( - f""" - auto {out_name} = {arg_name}.toDoubleList(); - """.split("\n") - ) - elif isinstance(t.elem, BaseType) and t.elem.name == BaseTy.bool: - # handle list type with size, e.g., bool[4] - code.extend( - f""" -#ifdef USE_ATEN_LIB -std::array {out_name}; -auto {in_name} = {arg_name}.toBoolList(); -size_t _i = 0; -for (auto {elem_name}: {in_name}) {{ - {out_name}[_i++] = {elem_name}; -}} -#else -auto {out_name} = {arg_name}.toBoolList(); -#endif - """.split("\n") - ) - # pytorch codegen: - # we have to use c10::List for optional element. e.g., Tensor?[] -> c10::List<::std::optional> - elif ( - isinstance(t.elem, OptionalType) - and isinstance(t.elem.elem, BaseType) - and t.elem.elem.name == BaseTy.Tensor - ): - code.extend( - f""" -#ifdef USE_ATEN_LIB -auto {in_name} = {arg_name}.toListOptionalTensor(); -c10::List<::std::optional> {out_name}; -for (auto {elem_name}: {in_name}) {{ - {out_name}.push_back({elem_name}); -}} -#else -auto {out_name} = {arg_name}.toListOptionalTensor(); -#endif - """.split("\n") - ) - else: - # use ArrayRef as default. - vec_name = arg_name + "_vec" - # need to bring vector instantiation out of scope so that ArrayRef has valid data - decl.append( - f"std::vector<{res_ctype.cpp_type(strip_ref=True)}> {vec_name};" - ) - code.extend( - f""" - for (EValue {elem_name}: {in_name}) {{ - {connector.join(res_code)} - {vec_name}.push_back({res_name}); - }} - {ctype.cpp_type(strip_ref=True)} {out_name}({vec_name}); - """.split("\n") - ) - return code, decl diff --git a/torchgen/executorch/model.py b/torchgen/executorch/model.py deleted file mode 100644 index 310c5968ec0..00000000000 --- a/torchgen/executorch/model.py +++ /dev/null @@ -1,220 +0,0 @@ -# Represents all kernels used by an Executorch model. -# It maintains a dict[OperatorName, dict[ETKernelKey, BackendMetadata]] structure. 
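# Illustrative shape only (abbreviated, not a literal repr): a yaml kernel entry with
# "arg_meta: null" ends up roughly as
#   { "add.out": { ETKernelKey(default=True): BackendMetadata(kernel="default_impl", ...) } }
# while entries with arg_meta produce one specialized ETKernelKey per combination of the
# dtype aliases they reference.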
- -from __future__ import annotations - -import itertools -from collections import defaultdict, namedtuple -from dataclasses import dataclass -from enum import IntEnum -from typing_extensions import assert_never - -from torchgen.model import ( - BackendIndex, - BackendMetadata, - DispatchKey, - NativeFunction, - NativeFunctionsGroup, - OperatorName, -) - - -KERNEL_KEY_VERSION = 1 - - -# TODO: Duplicated Subset from codegen.tool.gen_oplist, remove declaration in codegen -class ScalarType(IntEnum): - Byte = 0 - Char = 1 - Short = 2 - Int = 3 - Long = 4 - Float = 6 - Double = 7 - Bool = 11 - - -ETParsedYaml = namedtuple("ETParsedYaml", ["native_functions", "kernel_index"]) - - -@dataclass(frozen=True) -class ETKernelKeyOpArgMeta: - arg_name: str - dtype: str - # The order of the dimensions if entry is a Tensor - dim_order: tuple[int, ...] - - def to_native_string(self) -> str: - dtype_str = ScalarType[self.dtype].value - dim_str = str(self.dim_order)[1:-1].replace(" ", "") - return f"{dtype_str};{dim_str}" - - -@dataclass(frozen=True) -class ETKernelKey: - # Field undefined is default = True - arg_meta: tuple[ETKernelKeyOpArgMeta, ...] = () - - # Indicator for this kernel being used as a catch all - default: bool = False - - version: int = KERNEL_KEY_VERSION - - @staticmethod - def gen_from_yaml( - args: dict[str, tuple[str, str]], - type_alias_map: dict[str, list[str]], # TODO: Support unwrapped str val - dim_order_alias_map: dict[str, list[int]], - ) -> list[ETKernelKey]: - """Generate ETKernelKeys from arg kernel specs - Multiple ETKernelKeys are returned due to dtype permutations from utilizing - type_alias_map (actualizing each potential type permutation as a KernelKey) - - Args: - args: Mapping from argument name to kernel specs - Kernel specs are a tuple of (dtype, dim_order). 
- Currently tuple entries must be aliased via the alias map arguments - type_alias_map: Mapping from type alias to potential type enums - i.e { T0 : [Double, Int] } means T0 can be either Double or Int - Used for lookup by args - dim_order_alias_map: Mapping from alias to a list of dimension orders - Used for lookup by args - """ - # Cast to dim order to int - dim_order_alias_map = { - k: [int(alias) for alias in v] for k, v in dim_order_alias_map.items() - } - kernel_keys = [] - - # Get all used Dtype Alias - dtype_alias_used = set() - for type_alias, dim_order in args.values(): - # Enforce usage of alias initially - # TODO: Support inlined arguments - assert type_alias in type_alias_map, "Undefined type alias: " + str( - type_alias - ) - assert dim_order in dim_order_alias_map, ( - f"Undefined dim_order alias: {dim_order}" - ) - dtype_alias_used.add(type_alias) - - # Generate all permutations of dtype alias values - alias_dtypes = [ - [(alias, dtype) for dtype in type_alias_map[alias]] - for alias in dtype_alias_used - ] - alias_permutations = [ - dict(permutation) for permutation in list(itertools.product(*alias_dtypes)) - ] - - # Using each alias value permutation, generate kernel keys - op_arg_cache = {} - for permutation in alias_permutations: - arg_list = [] - for arg_name, arg_spec in args.items(): - dtype = permutation[arg_spec[0]] - dim_order = dim_order_alias_map[arg_spec[1]] # type: ignore[assignment] - if ( - cache_key := (arg_name, dtype, tuple(dim_order)) - ) not in op_arg_cache: - op_arg_cache[cache_key] = ETKernelKeyOpArgMeta(*cache_key) # type: ignore[arg-type] - - arg_list.append(op_arg_cache[cache_key]) - kernel_keys.append(ETKernelKey(tuple(arg_list))) - - return kernel_keys - - def to_native_string(self) -> str: - if self.default: - return "default" - return ( - "v" - + str(KERNEL_KEY_VERSION) - + "/" - + "|".join([arg.to_native_string() for arg in self.arg_meta]) - ) - - -@dataclass(frozen=True) -class ETKernelIndex: - index: dict[OperatorName, dict[ETKernelKey, BackendMetadata]] - - def has_kernels(self, g: NativeFunction | NativeFunctionsGroup) -> bool: - m = self.get_kernels(g) - return m is not None - - def get_kernels( - self, g: NativeFunction | NativeFunctionsGroup - ) -> dict[ETKernelKey, BackendMetadata]: - if isinstance(g, NativeFunction): - f = g - elif isinstance(g, NativeFunctionsGroup): - f = g.functional - else: - assert_never(g) - if f.func.name not in self.index: - return {} - return self.index[f.func.name] - - @staticmethod - def grow_from_backend_indices( - kernel_index: dict[OperatorName, dict[ETKernelKey, BackendMetadata]], - backend_indices: dict[DispatchKey, dict[OperatorName, BackendMetadata]], - ) -> None: - for dk in backend_indices: - index = backend_indices[dk] - for op, backend_metadata in index.items(): - if op in kernel_index: - kernel_index[op][ETKernelKey(default=True)] = backend_metadata - else: - kernel_index[op] = {ETKernelKey(default=True): backend_metadata} - - @staticmethod - def from_backend_indices( - backend_indices: dict[DispatchKey, dict[OperatorName, BackendMetadata]], - ) -> ETKernelIndex: - kernel_index: dict[OperatorName, dict[ETKernelKey, BackendMetadata]] = ( - defaultdict(dict) - ) - ETKernelIndex.grow_from_backend_indices(kernel_index, backend_indices) - return ETKernelIndex(kernel_index) - - def grow( - self, backend_indices: dict[DispatchKey, dict[OperatorName, BackendMetadata]] - ) -> ETKernelIndex: - ETKernelIndex.grow_from_backend_indices(self.index, backend_indices) - return self - - def 
_to_backend_index(self) -> BackendIndex: - """ - WARNING: this will be deprecated once all the codegen places know how to handle ETKernelIndex. - """ - index: dict[OperatorName, BackendMetadata] = {} - for op in self.index: - kernel_dict = self.index[op] - assert len(kernel_dict.values()) == 1, ( - f"Can't convert ETKernelIndex to BackendIndex because {op} has more than one kernels. Got {kernel_dict}" - ) - index[op] = kernel_dict.get( - ETKernelKey(default=True), - BackendMetadata(kernel="", structured=False, cpp_namespace=""), - ) - return BackendIndex( - dispatch_key=DispatchKey.CPU, - use_out_as_primary=False, - device_guard=False, - external=False, - index=index, - ) - - # Note duplicate ETKernelKey from index_b will clobber the metadata from index_a - @staticmethod - def merge_indices(index_a: ETKernelIndex, index_b: ETKernelIndex) -> ETKernelIndex: - combined = defaultdict(dict, index_a.index.copy()) - - for op, entry in index_b.index.items(): - for key, metadata in entry.items(): - combined[op][key] = metadata - - return ETKernelIndex(combined) diff --git a/torchgen/executorch/parse.py b/torchgen/executorch/parse.py deleted file mode 100644 index 8095abd5b6b..00000000000 --- a/torchgen/executorch/parse.py +++ /dev/null @@ -1,153 +0,0 @@ -from __future__ import annotations - -from collections import defaultdict, namedtuple -from typing import Any - -import yaml - -from torchgen.executorch.model import ETKernelIndex, ETKernelKey -from torchgen.gen import LineLoader, parse_native_yaml -from torchgen.model import ( - BackendMetadata, - DispatchKey, - FunctionSchema, - NativeFunction, - OperatorName, -) -from torchgen.utils import NamespaceHelper - - -# Parse native_functions.yaml into a sequence of NativeFunctions and ET Backend Indices. -ETParsedYaml = namedtuple("ETParsedYaml", ["native_functions", "et_kernel_indices"]) - -# Fields in native_functions.yaml used to determine which kernels should be used -ET_FIELDS = ["kernels", "type_alias", "dim_order_alias"] - - -def parse_from_yaml(ei: dict[str, object]) -> dict[ETKernelKey, BackendMetadata]: - """Given a loaded yaml representing kernel assignment information, extract the - mapping from `kernel keys` to `BackendMetadata` (the latter representing the kernel instance) - - Args: - ei: Dict keys {kernels, type_alias, dim_order_alias} - See ETKernelKey for description of arguments - """ - e = ei.copy() - if (kernels := e.pop("kernels", None)) is None: - return {} - - type_alias: dict[str, list[str]] = e.pop("type_alias", {}) # type: ignore[assignment] - dim_order_alias: dict[str, list[str]] = e.pop("dim_order_alias", {}) # type: ignore[assignment] - dim_order_alias.pop("__line__", None) - - kernel_mapping: dict[ETKernelKey, BackendMetadata] = {} - - for entry in kernels: # type: ignore[attr-defined] - arg_meta = entry.get("arg_meta") - if arg_meta is not None: - arg_meta.pop("__line__") - - kernel_name = entry.get("kernel_name") - namespace_helper = NamespaceHelper.from_namespaced_entity( - kernel_name, max_level=3 - ) - kernel_namespace = namespace_helper.get_cpp_namespace(default="at") - backend_metadata = BackendMetadata( - kernel=namespace_helper.entity_name, - structured=False, - cpp_namespace=(kernel_namespace + "::native"), - ) - - kernel_keys = ( - [ETKernelKey((), default=True)] - if arg_meta is None - else ETKernelKey.gen_from_yaml(arg_meta, type_alias, dim_order_alias) # type: ignore[arg-type] - ) - - for kernel_key in kernel_keys: - assert kernel_key not in kernel_mapping, ( - "Duplicate kernel key: " + str(kernel_key) + " " 
+ str(e) - ) - kernel_mapping[kernel_key] = backend_metadata - - return kernel_mapping - - -def parse_et_yaml_struct(es: object) -> ETKernelIndex: - """Given a loaded yaml representing a list of operators, for each op extract the mapping - of `kernel keys` to `BackendMetadata` (the latter representing the kernel instance - that should be used by the kernel key). - """ - indices: dict[OperatorName, dict[ETKernelKey, BackendMetadata]] = {} - for ei in es: # type: ignore[attr-defined] - e = ei.copy() - - funcs = e.pop("func") - assert isinstance(funcs, str), f"not a str: {funcs}" - namespace_helper = NamespaceHelper.from_namespaced_entity( - namespaced_entity=funcs, max_level=1 - ) - opname = FunctionSchema.parse(namespace_helper.entity_name).name - - assert opname not in indices, f"Duplicate func found in yaml: {opname} already" - - if len(index := parse_from_yaml(e)) != 0: - indices[opname] = index - - return ETKernelIndex(indices) - - -def extract_kernel_fields(es: object) -> dict[OperatorName, dict[str, Any]]: - """Given a loaded yaml representing a list of operators, extract the - kernel key related fields indexed by the operator name. - """ - fields: dict[OperatorName, dict[str, Any]] = defaultdict(dict) - for ei in es: # type: ignore[attr-defined] - funcs = ei.get("func") - assert isinstance(funcs, str), f"not a str: {funcs}" - namespace_helper = NamespaceHelper.from_namespaced_entity( - namespaced_entity=funcs, max_level=1 - ) - opname = FunctionSchema.parse(namespace_helper.entity_name).name - - for field in ET_FIELDS: - if (value := ei.get(field)) is not None: - fields[opname][field] = value - - return fields - - -def parse_et_yaml( - path: str, - tags_yaml_path: str, - ignore_keys: set[DispatchKey] | None = None, - skip_native_fns_gen: bool = False, -) -> tuple[list[NativeFunction], dict[OperatorName, dict[str, Any]]]: - """Parse native_functions.yaml into NativeFunctions and an Operator Indexed Dict - of fields to persist from native_functions.yaml to functions.yaml - """ - with open(path) as f: - es = yaml.load(f, Loader=LineLoader) - - et_kernel = extract_kernel_fields(es) - - # Remove ET specific fields from entries for BC compatibility - strip_et_fields(es) - - native_yaml = parse_native_yaml( - path, - tags_yaml_path, - ignore_keys, - skip_native_fns_gen=skip_native_fns_gen, - loaded_yaml=es, - ) - return native_yaml.native_functions, et_kernel - - -def strip_et_fields(es: object) -> None: - """Given a loaded yaml representing a list of operators, - remove ET specific fields from every entries for BC compatibility - """ - for entry in es: # type: ignore[attr-defined] - for field in ET_FIELDS: - entry.pop(field, None) diff --git a/torchgen/gen_executorch.py b/torchgen/gen_executorch.py deleted file mode 100644 index 306333f1eae..00000000000 --- a/torchgen/gen_executorch.py +++ /dev/null @@ -1,1024 +0,0 @@ -from __future__ import annotations - -import argparse -import os -from collections import defaultdict -from dataclasses import dataclass -from pathlib import Path -from typing import Any, Callable, TextIO, TYPE_CHECKING - -import yaml - -# Parse native_functions.yaml into a sequence of NativeFunctions and Backend Indices. 
-from torchgen import dest -from torchgen.api import cpp as aten_cpp -from torchgen.api.types import CppSignature, CppSignatureGroup, CType, NamedCType -from torchgen.context import ( - method_with_native_function, - method_with_nested_native_function, - with_native_function_and_index, -) -from torchgen.executorch.api import et_cpp -from torchgen.executorch.api.custom_ops import ( - ComputeNativeFunctionStub, - gen_custom_ops_registration, -) -from torchgen.executorch.api.types import contextArg, ExecutorchCppSignature -from torchgen.executorch.api.unboxing import Unboxing -from torchgen.executorch.model import ETKernelIndex, ETKernelKey, ETParsedYaml -from torchgen.executorch.parse import ET_FIELDS, parse_et_yaml, parse_et_yaml_struct -from torchgen.gen import ( - get_custom_build_selector, - get_native_function_declarations, - get_native_function_declarations_from_ns_grouped_kernels, - get_native_function_schema_registrations, - LineLoader, - parse_native_yaml, -) -from torchgen.model import ( - BackendIndex, - BackendMetadata, - DEFAULT_KERNEL_NAMESPACE, - DispatchKey, - FunctionSchema, - Location, - NativeFunction, - NativeFunctionsGroup, - OperatorName, - Variant, -) -from torchgen.utils import ( - context, - FileManager, - make_file_manager, - mapMaybe, - NamespaceHelper, -) - - -if TYPE_CHECKING: - from collections.abc import Sequence - - from torchgen.selective_build.selector import SelectiveBuilder - - -def _sig_decl_wrapper(sig: CppSignature | ExecutorchCppSignature) -> str: - """ - A wrapper function to basically get `sig.decl(include_context=True)`. - For ATen kernel, the codegen has no idea about ET contextArg, so we - use this wrapper to add it. - """ - if isinstance(sig, ExecutorchCppSignature): - return sig.decl() - - returns_type = aten_cpp.returns_type(sig.func.returns).cpp_type() - cpp_args = [a.decl() for a in sig.arguments()] - cpp_args_str = ", ".join([contextArg.decl()] + cpp_args) - sig_decl = f"{returns_type} {sig.name()}({cpp_args_str})" - return sig_decl - - -def static_dispatch( - sig: CppSignature | ExecutorchCppSignature, - f: NativeFunction, - backend_indices: list[BackendIndex], -) -> str: - """ - For a given `NativeFunction`, find out the corresponding native function and dispatch to it. If zero or more than one - native function exists, error out. A simplified version of register_dispatch_key.py - Arguments: - sig: A CppSignature for this native function we want to use. - f: NativeFunction to generate static dispatch. - backend_indices: All available backends. - Return: - C++ code to call backend-specific functions, e.g., "return at::native::add(self, other, scale);" - """ - if len(backend_indices) == 0 or f.manual_kernel_registration: - return "" - - backends = [b for b in backend_indices if b.has_kernel(f)] - static_block = None - if len(backends) == 1: - backend_metadata = backends[0].get_kernel(f) - if backend_metadata: - args = ", ".join(a.name for a in sig.arguments()) - # Here we are assuming there's no difference between CppSignature and NativeSignature for Executorch. 
- static_block = f"return ::{backend_metadata.cpp_namespace}::{backend_metadata.kernel}({args});" - else: - static_block = f""" -ET_ASSERT_UNREACHABLE_MSG("The number of native function(s) binding to {f.func.name} is {len(backends)}."); - """ - return f""" -// {f.namespace}::{f.func} -TORCH_API inline {_sig_decl_wrapper(sig)} {{ - {static_block} -}} -""" - - -# Generates Functions.h, which provides the functional public C++ API, -# and the scaffolding to call into the dispatcher from these functions. -@dataclass(frozen=True) -class ComputeFunction: - static_dispatch_backend_indices: list[BackendIndex] - - selector: SelectiveBuilder - - use_aten_lib: bool - - is_custom_op: Callable[[NativeFunction], bool] - - @method_with_native_function - def __call__(self, f: NativeFunction) -> str | None: - is_method_variant = False - if not self.selector.is_root_operator(f"{f.namespace}::{f.func.name}"): - return None - - if Variant.function not in f.variants and Variant.method in f.variants: - is_method_variant = True - - # only valid remaining case is only function is in f.variants - elif not (Variant.function in f.variants and Variant.method not in f.variants): - raise Exception( # noqa: TRY002 - f"Can't handle native function {f.func} with the following variant specification {f.variants}." - ) - - sig: CppSignature | ExecutorchCppSignature = ( - CppSignatureGroup.from_native_function( - f, method=False, fallback_binding=f.manual_cpp_binding - ).most_faithful_signature() - if self.use_aten_lib - else ExecutorchCppSignature.from_native_function(f) - ) - if self.use_aten_lib and not self.is_custom_op(f): - comma = ", " - - if is_method_variant: - return f""" -// {f.namespace}::{f.func} -TORCH_API inline {_sig_decl_wrapper(sig)} {{ - return {sig.arguments()[0].name}.{sig.name()}({comma.join(e.name for e in sig.arguments()[1:])}); -}} -""" - else: - return f""" -// {f.namespace}::{f.func} -TORCH_API inline {_sig_decl_wrapper(sig)} {{ - return at::{sig.name()}({comma.join(e.name for e in sig.arguments())}); -}} -""" - - else: - return static_dispatch( - sig, - f, - backend_indices=self.static_dispatch_backend_indices, - ) - - -# Generates RegisterCodegenUnboxedKernels.cpp. 
-@dataclass(frozen=True) -class ComputeCodegenUnboxedKernels: - selector: SelectiveBuilder - - use_aten_lib: bool - - add_exception_boundary: bool - - @method_with_nested_native_function - def __call__( - self, - unbox_kernel_entry: tuple[NativeFunction, tuple[ETKernelKey, BackendMetadata]], - ) -> str: - f: NativeFunction = unbox_kernel_entry[0] - kernel_key: ETKernelKey | list[ETKernelKey] = unbox_kernel_entry[1][0] - kernel_meta: BackendMetadata = unbox_kernel_entry[1][1] - - op_name = f"{f.namespace}::{f.func.name}" - if not self.selector.is_root_operator(op_name): - return "" - - if not isinstance(kernel_key, list): - kernel_key = [kernel_key] - used_kernel_keys = self.selector.et_get_selected_kernels( - op_name, [k.to_native_string() for k in kernel_key] - ) - if not used_kernel_keys: - return "" - sig: CppSignature | ExecutorchCppSignature - argument_type_gen: Callable[..., NamedCType] - return_type_gen: Callable[..., CType] - if self.use_aten_lib: - sig = CppSignatureGroup.from_native_function( - f, method=False, fallback_binding=f.manual_cpp_binding - ).most_faithful_signature() - argument_type_gen = aten_cpp.argumenttype_type - return_type_gen = aten_cpp.returns_type - arguments = sig.arguments() - kernel_call = f"torch::executor::{f.namespace}::{sig.name()}" - else: - sig = ExecutorchCppSignature.from_native_function(f) - argument_type_gen = et_cpp.argumenttype_type - return_type_gen = et_cpp.returns_type - arguments = sig.arguments(include_context=False) - kernel_call = f"{kernel_meta.cpp_namespace}::{kernel_meta.kernel}" - # parse arguments into C++ code - binding_list, code_list = Unboxing( - argument_type_gen=argument_type_gen - ).convert_arguments(arguments) - - # for each C++ argument, generate the conversion code - code_connector = "\n\t" - arg_connector = ", " - - args_str = f"{arg_connector.join(e.name for e in binding_list)}" - event_tracer_output_logging = "" - output_ids = [] - - if len(f.func.returns) == 0: - if len(f.func.arguments.out) == 0: - raise Exception( # noqa: TRY002 - f"Can't handle native function {f.func} with no returns and no out yet." 
- ) - out = f.func.arguments.out[0] - return_assignment = f"""stack[{len(binding_list)}] = &{out.name};""" - ret_prefix = "" - output_ids = [len(binding_list)] - else: - if len(f.func.arguments.out) == 0: - return_assignment = ( - f"""*stack[{len(binding_list)}] = EValue(result_);""" - ) - ret_prefix = return_type_gen(f.func.returns).cpp_type() + " result_ = " - output_ids = [len(binding_list)] - else: - return_assignment = "" - ret_prefix = "" - output_ids = [ - len(binding_list) - (i + 1) - for i in reversed(range(len(f.func.arguments.out))) - ] - - for output_id in output_ids: - event_tracer_output_logging += ( - f"internal::event_tracer_log_evalue(" - f"context.internal_event_tracer(), " - f"*stack[{output_id}]);\n" - ) - - exception_boundary_begin = "" - exception_boundary_end = "" - if self.add_exception_boundary: - indent = " " * 8 - exception_boundary_begin = indent + "try {" - exception_boundary_end = f"""{indent}}} catch (const std::exception& ex) {{ -{indent} ET_LOG(Error, "Kernel threw an exception: %s", ex.what()); -{indent} context.fail(torch::executor::Error::Internal); -{indent}}}""" - newline = "\n " - return "\n".join( - [ - f""" -Kernel( - "{f.namespace}::{f.func.name}",{newline + '"' + (k + '",') if k != "default" else ""} - []({contextArg.defn()}, EValue** stack) {{ - {code_connector.join(code_list)} - -{exception_boundary_begin} - internal::EventTracerProfileOpScope event_tracer_op_scope(context.internal_event_tracer(), "native_call_{f.func.name}"); - EXECUTORCH_SCOPE_PROF("native_call_{f.func.name}"); - {ret_prefix}{kernel_call}(context, {args_str}); - {event_tracer_output_logging} - {return_assignment} -{exception_boundary_end} - }} -), -""" - for k in used_kernel_keys - ] - ) - - -def gen_unboxing( - *, - native_functions: Sequence[NativeFunction], - cpu_fm: FileManager, - selector: SelectiveBuilder, - use_aten_lib: bool, - kernel_index: ETKernelIndex, - manual_registration: bool, - add_exception_boundary: bool = False, -) -> None: - # Iterable type for write_sharded is a Tuple of (native_function, (kernel_key, metadata)) - def key_func( - item: tuple[NativeFunction, tuple[ETKernelKey, BackendMetadata]], - ) -> str: - return item[0].root_name + ":" + item[1][0].to_native_string() - - items: list[tuple[NativeFunction, tuple[ETKernelKey, BackendMetadata]]] = [ - (native_function, (kernel_key, metadata)) - for native_function in native_functions - for kernel_key, metadata in kernel_index.get_kernels(native_function).items() - ] - - header = ["Functions.h" if use_aten_lib else "NativeFunctions.h"] - filename = ( - "RegisterKernels.cpp" - if manual_registration - else "RegisterCodegenUnboxedKernels.cpp" - ) - cpu_fm.write_sharded( - filename, - items, - key_fn=key_func, - env_callable=lambda unbox_kernel_entry: { - "unboxed_kernels": [ - ComputeCodegenUnboxedKernels( - selector, use_aten_lib, add_exception_boundary - )(unbox_kernel_entry) - ], - "fn_header": header - if unbox_kernel_entry == items[0] - else [], # Only write header once - }, - num_shards=1, - sharded_keys={"unboxed_kernels", "fn_header"}, - ) - - -@with_native_function_and_index # type: ignore[arg-type] -def compute_native_function_declaration( - g: NativeFunctionsGroup | NativeFunction, kernel_index: ETKernelIndex -) -> list[str]: - assert isinstance(g, NativeFunction) - sig = ExecutorchCppSignature.from_native_function(f=g) - metadata_list = kernel_index.get_kernels(g).values() - if metadata_list is None: - return [] - - # for kernels in lean mode, we declare two versions, one with context and one 
without. - # In the end we will cleanup the unused one. - def gen_decl(metadata: BackendMetadata, include_context: bool) -> str: - return f"{sig.decl(name=metadata.kernel, include_context=include_context)};" - - return [ - gen_decl(metadata, include_context) - for include_context in [False, True] - for metadata in metadata_list - ] - - -def gen_functions_declarations( - *, - native_functions: Sequence[NativeFunction], - kernel_index: ETKernelIndex, - selector: SelectiveBuilder, - use_aten_lib: bool, - custom_ops_native_functions: Sequence[NativeFunction] | None = None, -) -> str: - """ - Generates namespace separated C++ function API inline declaration/definitions. - Native functions are grouped by namespaces and the generated code is wrapped inside - namespace blocks. - - E.g., for `custom_1::foo.out` in yaml file we will generate a C++ API as a symbol - in `torch::executor::custom_1::foo_out`. This way we avoid symbol conflict when - the other `custom_2::foo.out` is available. - """ - - # convert kernel index to BackendIndex. This is because we can't handle ETKernelIndex yet. - # TODO larryliu: evaluate if this code is still needed. If yes let it handle ETKernelIndex. - - backend_index = kernel_index._to_backend_index() - - ns_grouped_functions = defaultdict(list) - for native_function in native_functions: - ns_grouped_functions[native_function.namespace].append(native_function) - functions_declarations = "" - newline = "\n" - for namespace in ns_grouped_functions: - ns_helper = NamespaceHelper( - namespace_str=namespace, - entity_name="", - max_level=3, - ) - declarations = list( - mapMaybe( - ComputeFunction( - static_dispatch_backend_indices=[backend_index], - selector=selector, - use_aten_lib=use_aten_lib, - is_custom_op=lambda f: custom_ops_native_functions is not None - and f in custom_ops_native_functions, - ), - ns_grouped_functions[namespace], - ) - ) - functions_declarations += f""" -{ns_helper.prologue} -{newline.join(declarations)} -{ns_helper.epilogue} - """ - return functions_declarations - - -def get_ns_grouped_kernels( - *, - native_functions: Sequence[NativeFunction], - kernel_index: ETKernelIndex, - native_function_decl_gen: Callable[ - [ - NativeFunctionsGroup | NativeFunction, - ETKernelIndex, - ], - list[str], - ], -) -> dict[str, list[str]]: - ns_grouped_kernels: dict[str, list[str]] = defaultdict(list) - for f in native_functions: - native_function_namespaces = set() - op_kernels = kernel_index.get_kernels(f) - for backend_metadata in op_kernels.values(): - if backend_metadata: - namespace = backend_metadata.cpp_namespace - native_function_namespaces.add(namespace) - else: - namespace = DEFAULT_KERNEL_NAMESPACE - assert len(native_function_namespaces) <= 1, ( - f"Codegen only supports one namespace per operator, got {native_function_namespaces}" - ) - ns_grouped_kernels[namespace].extend( - native_function_decl_gen(f, kernel_index) - ) - return ns_grouped_kernels - - -def gen_headers( - *, - native_functions: Sequence[NativeFunction], - gen_custom_ops_header: bool, - custom_ops_native_functions: Sequence[NativeFunction], - selector: SelectiveBuilder, - kernel_index: ETKernelIndex, - cpu_fm: FileManager, - use_aten_lib: bool, -) -> None: - """Generate headers. - - Args: - native_functions (Sequence[NativeFunction]): a collection of NativeFunction for ATen ops. - gen_custom_ops_header (bool): whether we should generate CustomOpsNativeFunctions.h - custom_ops_native_functions (Sequence[NativeFunction]): a collection of NativeFunction for custom ops. 
- kernel_index (ETKernelIndex): kernel collection - cpu_fm (FileManager): file manager manages output stream - use_aten_lib (bool): whether we are generating for PyTorch types or Executorch types. - """ - aten_headers = ["#include "] - backend_indices = {DispatchKey.CPU: kernel_index._to_backend_index()} - if gen_custom_ops_header: - cpu_fm.write_with_template( - "CustomOpsNativeFunctions.h", - "NativeFunctions.h", - lambda: { - "nativeFunctions_declarations": get_native_function_declarations( - grouped_native_functions=custom_ops_native_functions, - backend_indices=backend_indices, - native_function_decl_gen=dest.compute_native_function_declaration, - ), - "headers": [ - "#include ", - "#include ", - ], - }, - ) - aten_headers.append('#include "CustomOpsNativeFunctions.h"') - cpu_fm.write( - "Functions.h", - lambda: { - "static_dispatch_extra_headers": aten_headers - if use_aten_lib - else ['#include "NativeFunctions.h"'], - "Functions_declarations": gen_functions_declarations( - native_functions=native_functions, - kernel_index=kernel_index, - selector=selector, - use_aten_lib=use_aten_lib, - custom_ops_native_functions=custom_ops_native_functions, - ), - }, - ) - cpu_fm.write( - "RegisterKernels.h", - lambda: { - "generated_comment": "@" + "generated by torchgen/gen_executorch.py", - }, - ) - headers = { - "headers": [ - "#include // at::Tensor etc.", - "#include ", - ], - } - if use_aten_lib: - headers["headers"].append("#include // TORCH_API") - cpu_fm.write( - "NativeFunctions.h", - lambda: dict( - { - "nativeFunctions_declarations": get_native_function_declarations( - grouped_native_functions=native_functions, - backend_indices=backend_indices, - native_function_decl_gen=dest.compute_native_function_declaration, - ), - }, - **headers, - ), - ) - else: - ns_grouped_kernels = get_ns_grouped_kernels( - native_functions=native_functions, - kernel_index=kernel_index, - native_function_decl_gen=compute_native_function_declaration, # type: ignore[arg-type] - ) - cpu_fm.write( - "NativeFunctions.h", - lambda: dict( - { - "nativeFunctions_declarations": get_native_function_declarations_from_ns_grouped_kernels( - ns_grouped_kernels=ns_grouped_kernels, - ), - }, - **headers, - ), - ) - - -def gen_custom_ops( - *, - native_functions: Sequence[NativeFunction], - selector: SelectiveBuilder, - kernel_index: ETKernelIndex, - cpu_fm: FileManager, - rocm: bool, -) -> None: - dispatch_key = DispatchKey.CPU - ( - anonymous_definition, - static_init_dispatch_registrations, - ) = gen_custom_ops_registration( - native_functions=native_functions, - selector=selector, - kernel_index=kernel_index, - rocm=rocm, - ) - cpu_fm.write_with_template( - f"Register{dispatch_key}CustomOps.cpp", - "RegisterDispatchKeyCustomOps.cpp", - lambda: { - "ops_headers": '#include "CustomOpsNativeFunctions.h"', - "DispatchKey": dispatch_key, - "dispatch_namespace": dispatch_key.lower(), - "dispatch_namespaced_definitions": "", - "dispatch_anonymous_definitions": anonymous_definition, - "static_init_dispatch_registrations": static_init_dispatch_registrations, - }, - ) - cpu_fm.write_with_template( - f"Register{dispatch_key}Stub.cpp", - "RegisterDispatchKeyCustomOps.cpp", - lambda: { - "ops_headers": "", - "DispatchKey": dispatch_key, - "dispatch_namespace": dispatch_key.lower(), - "dispatch_namespaced_definitions": "", - "dispatch_anonymous_definitions": list( - mapMaybe(ComputeNativeFunctionStub(), native_functions) - ), - "static_init_dispatch_registrations": static_init_dispatch_registrations, - }, - ) - - ( - 
aten_schema_registrations, - schema_registrations, - ) = get_native_function_schema_registrations( - native_functions=native_functions, - schema_selector=selector, - ) - cpu_fm.write( - "RegisterSchema.cpp", - lambda: { - "schema_registrations": schema_registrations, - "aten_schema_registrations": aten_schema_registrations, - }, - ) - - -def translate_native_yaml( - tags_yaml_path: str, - aten_yaml_path: str, - native_yaml_path: str | None, - use_aten_lib: bool, - out_file: TextIO, -) -> None: - """Translates Executorch DSL dialect to use the same syntax as - native_functions.yaml. The major difference is that Executorch DSL dialect - supports "op" key, where it refers to the operator name in native_functions.yaml. - - For example, a functions.yaml may have the following entry: - - - op: add.out - ... - - It needs to be translated to the following: - - - func: add.out(Tensor self, Tensor other, *, Scalar alpha=1, Tensor(a!) out) -> Tensor(a!) - ... - - We go in aten_yaml_path and find the operator schema for "add.out" and add it - to the original functions.yaml. We also add required field "variants", where for - Executorch it will always be "function". - - For ATen mode we don't have to do the translation because native_yaml_path is - the same as native_functions.yaml. - - Args: - tags_yaml_path: Path to a tags.yaml file to satisfy codegen parsing. - It is not optional. - aten_yaml_path: Path to ATen operator yaml file native_functions.yaml. - native_yaml_path: Path to a functions.yaml file to parse. - If the path does not exist in the filesystem, it is treated as an - empty file. If `custom_ops_yaml_path` exists, the contents of that - file are appended to the yaml input to be parsed. - use_aten_lib: We use this flag to determine if we want to generate native - functions. In ATen mode we should generate out= variants. - out_file: The IO object that we are writing into. 
- Returns: - None - """ - if use_aten_lib: - with open(aten_yaml_path) as aten_yaml: - out_file.writelines(aten_yaml.readlines()) - return - - native_functions, persisted_fields = parse_et_yaml( - aten_yaml_path, - tags_yaml_path, - None, - skip_native_fns_gen=False, - ) - - func_to_scoped_name: dict[FunctionSchema, str] = { - f.func: f"{f.namespace}::{f.func.name}" for f in native_functions - } - op_to_scoped_name: dict[OperatorName, str] = { - func.name: name for func, name in func_to_scoped_name.items() - } - - schema_dict = {name: str(func) for func, name in func_to_scoped_name.items()} - kernel_persist_dict: dict[str, dict[str, Any]] = { - op_to_scoped_name[op]: v for op, v in persisted_fields.items() - } - - if ( - not native_yaml_path - or not os.path.exists(native_yaml_path) - or os.stat(native_yaml_path).st_size == 0 - ): - return - with open(native_yaml_path) as native_yaml: - native_es = yaml.load(native_yaml, Loader=LineLoader) - if not native_es: - return - for e in native_es: - assert isinstance(e.get("__line__"), int), e - loc = Location(native_yaml_path, e.pop("__line__")) - with context(lambda: f"in {loc}:\n "): - if "variants" not in e: - e["variants"] = "function" - if "func" in e: - continue - assert isinstance(e.get("op"), str), e - opname = e.pop("op") - if "::" not in opname: - opname = "aten::" + opname - assert opname in schema_dict - e["func"] = schema_dict.get(opname) - - # Write out persisted kernel information - if opname in kernel_persist_dict: - for k, v in kernel_persist_dict[opname].items(): - e[k] = v - - yaml.dump(native_es, out_file, width=1000) - - -def parse_yaml( - path: str | None, - tags_yaml_path: str, - function_filter: Callable[[NativeFunction], bool], - skip_native_fns_gen: bool = False, -) -> tuple[ - list[NativeFunction], - dict[DispatchKey, dict[OperatorName, BackendMetadata]] | ETKernelIndex, -]: - if path and os.path.exists(path) and os.stat(path).st_size > 0: - with open(path) as f: - es = yaml.load(f, Loader=LineLoader) - - # Check for kernel index structure - kernel_index = ( - parse_et_yaml_struct(es) if any("kernels" in e for e in es) else None - ) - - # Remove ET specific fields from entries for BC compatibility - for entry in es: - for field in ET_FIELDS: - entry.pop(field, None) - - parsed_yaml = parse_native_yaml( - path, - tags_yaml_path, - None, - skip_native_fns_gen=skip_native_fns_gen, - loaded_yaml=es, - ) - native_functions = list(filter(function_filter, parsed_yaml.native_functions)) - op_names = [f.func.name for f in native_functions] - - # (1) Return ETKernelIndex if kernel index is present - if kernel_index is not None: - filtered_index = { - op_name: kernel_mapping - for op_name, kernel_mapping in kernel_index.index.items() - if op_name in op_names - } - return native_functions, ETKernelIndex(index=filtered_index) - - # (2) Return BackendIndices if kernel index is absent - def map_index( - m: dict[OperatorName, BackendMetadata], - ) -> dict[OperatorName, BackendMetadata]: - return {op: m[op] for op in m if op in op_names} - - backend_indices = { - k: map_index(b.index) for (k, b) in parsed_yaml.backend_indices.items() - } - - return native_functions, backend_indices - else: - return [], {} - - -def parse_yaml_files( - tags_yaml_path: str, - aten_yaml_path: str, - native_yaml_path: str | None, - custom_ops_yaml_path: str | None, - selector: SelectiveBuilder, - use_aten_lib: bool, -) -> tuple[ETParsedYaml, ETParsedYaml | None]: - """Parses functions.yaml and custom_ops.yaml files. 
- - Args: - tags_yaml_path: Path to a tags.yaml file to satisfy codegen parsing. - It is not optional. - aten_yaml_path: Path to ATen operator yaml file native_functions.yaml. - native_yaml_path: Path to a functions.yaml file to parse. - If the path does not exist in the filesystem, it is treated as an - empty file. If `custom_ops_yaml_path` exists, the contents of that - file are appended to the yaml input to be parsed. - custom_ops_yaml_path: Path to a custom_ops.yaml file to parse. If - the path does not exist in the filesystem, it is ignored. - selector: For selective build. - use_aten_lib: We use this flag to determine if we want to generate native - functions. In ATen mode we should generate out= variants. - Returns: - A tuple with two elements: - [0]: The parsed results of concatenating the contents of - `native_yaml_path` and `custom_ops_yaml_path`. - [1]: The parsed results of the contents of `custom_ops_yaml_path`, if - present. If not present, None. - """ - import tempfile - - # only include selected ops, this is because we want to avoid - def function_filter(f: NativeFunction) -> bool: - return selector.is_native_function_selected(f) - - with tempfile.TemporaryDirectory() as tmpdirname: - translated_yaml_path = os.path.join(tmpdirname, "translated.yaml") - with open(translated_yaml_path, "w") as translated: - translate_native_yaml( - tags_yaml_path, - aten_yaml_path, - native_yaml_path, - use_aten_lib, - translated, - ) - - translated_functions, translated_indices = parse_yaml( - translated_yaml_path, tags_yaml_path, function_filter, not use_aten_lib - ) - custom_ops_functions, custom_ops_indices = parse_yaml( - custom_ops_yaml_path, tags_yaml_path, function_filter, True - ) - - # Convert BackendIndices to ETKernelIndex - if not isinstance(translated_indices, ETKernelIndex): - translated_indices = ETKernelIndex.from_backend_indices(translated_indices) - if not isinstance(custom_ops_indices, ETKernelIndex): - custom_ops_indices = ETKernelIndex.from_backend_indices(custom_ops_indices) - - combined_functions = translated_functions + custom_ops_functions - combined_kernel_index = ETKernelIndex.merge_indices( - translated_indices, custom_ops_indices - ) - combined_yaml = ETParsedYaml(combined_functions, combined_kernel_index) - custom_ops_parsed_yaml = ETParsedYaml(custom_ops_functions, custom_ops_indices) - - return combined_yaml, custom_ops_parsed_yaml - - -def main() -> None: - parser = argparse.ArgumentParser(description="Generate operator source files") - # Although we don't refer to --source-path directly, make_file_manager() - # expects it to point to a directory that contains a templates/ subdirectory - # containing the file templates. - parser.add_argument( - "-s", - "--source-path", - help="path to source directory for kernel templates", - ) - parser.add_argument( - "--functions-yaml-path", - "--functions_yaml_path", - help="path to the functions.yaml file to use. Optional, but at least " - "one of --functions-yaml-path and --custom-ops-yaml-path must be " - "specified.", - ) - parser.add_argument( - "--custom-ops-yaml-path", - "--custom_ops_yaml_path", - help="path to the custom_ops.yaml file to use. Optional, but at least " - "one of --functions-yaml-path and --custom-ops-yaml-path must be " - "specified.", - ) - parser.add_argument( - "--aten-yaml-path", - "--aten_yaml_path", - help="path to native_functions.yaml file.", - ) - # Note that make_file_manager() also looks at --install-dir. 
- parser.add_argument( - "-d", - "--install-dir", - "--install_dir", - help="output directory", - default="build/generated", - ) - parser.add_argument( - "-o", - "--output-dependencies", - help="output a list of dependencies into the given file and exit", - ) - # Although we don't refer to --dry-run directly, make_file_manager() looks - # for it. - parser.add_argument( - "--dry-run", - action="store_true", - help="run without writing any files (still updates outputs)", - ) - parser.add_argument( - "--static-dispatch-backend", - "--static_dispatch_backend", - nargs="*", - help="generate static dispatch code for the specific backend (if set)", - ) - parser.add_argument( - "--op-registration-whitelist", - "--op_registration_whitelist", - nargs="*", - help="filter op registrations by the whitelist (if set); " - "each item is `namespace`::`operator name` without overload name; " - "e.g.: aten::empty aten::conv2d ...", - ) - parser.add_argument( - "--op-selection-yaml-path", - "--op_selection_yaml_path", - help="Provide a path to the operator selection (for custom build) YAML " - "that contains the information about the set of selected operators " - "and their categories (training, ...). Each operator is either a " - "full operator name with overload or just a bare operator name. " - "The operator names also contain the namespace prefix (e.g. aten::)", - ) - parser.add_argument( - "--tags-path", - help="Path to tags.yaml. Required by yaml parsing in codegen system.", - ) - parser.add_argument( - "--rocm", - action="store_true", - help="reinterpret CUDA as ROCm/HIP and adjust filepaths accordingly", - ) - parser.add_argument( - "--use-aten-lib", - "--use_aten_lib", - action="store_true", - help="a boolean flag to indicate whether we use ATen kernels or not, in the future this flag will be per " - "operator", - ) - parser.add_argument( - "--manual_registration", - "--manual-registration", - action="store_true", - help="a boolean flag to indicate whether we want to manually call" - "register_kernels() or rely on static init. ", - ) - parser.add_argument( - "--generate", - type=str, - nargs="*", - choices=["headers", "sources"], - default=["headers", "sources"], - help="Generate only a subset of files", - ) - parser.add_argument( - "--add-exception-boundary", - "--add_exception_boundary", - action="store_true", - help="whether to add a try/catch in the generated kernel wrapper to " - "convert exceptions to clean failures.", - ) - options = parser.parse_args() - assert options.tags_path, "tags.yaml is required by codegen yaml parsing." - - selector = get_custom_build_selector( - options.op_registration_whitelist, - options.op_selection_yaml_path, - ) - - parsed_yaml, custom_ops_parsed_yaml = parse_yaml_files( - aten_yaml_path=options.aten_yaml_path, - tags_yaml_path=options.tags_path, - native_yaml_path=options.functions_yaml_path, - custom_ops_yaml_path=options.custom_ops_yaml_path, - selector=selector, - use_aten_lib=options.use_aten_lib, - ) - native_functions, kernel_index = ( - parsed_yaml.native_functions, - parsed_yaml.kernel_index, - ) - custom_ops_native_functions = ( - custom_ops_parsed_yaml.native_functions if custom_ops_parsed_yaml else [] - ) - - cpu_fm = make_file_manager(options=options) - - if "headers" in options.generate: - # generate CustomOpsNativeFunctions.h when custom_ops.yaml is present, to match the build system. 
- gen_headers( - native_functions=native_functions, - gen_custom_ops_header=options.custom_ops_yaml_path, - custom_ops_native_functions=custom_ops_native_functions, - selector=selector, - kernel_index=kernel_index, - cpu_fm=cpu_fm, - use_aten_lib=options.use_aten_lib, - ) - - if "sources" in options.generate: - gen_unboxing( - native_functions=native_functions, - cpu_fm=cpu_fm, - selector=selector, - use_aten_lib=options.use_aten_lib, - kernel_index=kernel_index, - manual_registration=options.manual_registration, - add_exception_boundary=options.add_exception_boundary, - ) - if custom_ops_native_functions: - gen_custom_ops( - native_functions=custom_ops_native_functions, - selector=selector, - kernel_index=kernel_index, - cpu_fm=cpu_fm, - rocm=options.rocm, - ) - - if options.output_dependencies: - depfile_path = Path(options.output_dependencies).resolve() - depfile_name = depfile_path.name - depfile_stem = depfile_path.stem - - for fm, prefix in [ - (cpu_fm, ""), - ]: - varname = prefix + depfile_stem - path = depfile_path.parent / (prefix + depfile_name) - fm.write_outputs(varname, str(path)) - - -if __name__ == "__main__": - main()