DeepRec-AI
diff --git a/tensorflow/compiler/jit/BUILD b/tensorflow/compiler/jit/BUILD
Lines changed: 182 additions & 0 deletions
@@ -41,6 +41,8 @@ cc_library(
     ] + if_cuda([
         ":xla_gpu_device",
         ":xla_gpu_jit",
+        ":jit_cuda_graph_mode_passes",
+        "//tensorflow/compiler/jit/kernels:cuda_graph_mode_ops",
     ]),
     alwayslink = 1,
 )
@@ -327,6 +329,17 @@ cc_library(
     alwayslink = 1,
 )
 
+cc_library(  # Thin wrapper over :cuda_graph_mode_passes; listed in the if_cuda() deps of an earlier target in this file.
+    name = "jit_cuda_graph_mode_passes",
+    srcs = ["jit_cuda_graph_mode_pass_registration.cc"],  # presumably holds the pass registrations (going by the file name) - confirm
+    visibility = ["//visibility:public"],
+    deps = [
+        ":cuda_graph_mode_passes",
+        "//tensorflow/core:core_cpu_internal",
+    ] + tf_jit_compilation_passes_extra_deps(),  # extra deps come from a macro defined outside this diff
+    alwayslink = 1,  # link every object file of this target even if the binary references none of its symbols
+)
+
 cc_library(
     name = "xla_kernel_creator",
     srcs = [
@@ -578,6 +591,93 @@ cc_library(
     ],
 )
 
+cc_library(  # Pass sources (per the *_pass.cc file names), their headers and deps for CUDA graph mode.
+    name = "cuda_graph_mode_passes",
+    srcs = [  # NOTE(review): several names here are not CUDA-graph specific - confirm no other target in this package compiles the same .cc files
+        "build_cuda_graph_mode_ops_pass.cc",
+        "clone_constants_for_better_clustering.cc",
+        "cluster_scoping_pass.cc",
+        "deadness_analysis.cc",
+        "deadness_analysis_internal.h",  # header kept in srcs, i.e. not exported through hdrs
+        "encapsulate_subgraphs_pass.cc",
+        "encapsulate_cuda_graph_mode_subgraphs_pass.cc",
+        "encapsulate_xla_computations_pass.cc",
+        "extract_outside_compilation_pass.cc",
+        "increase_dynamism_for_auto_jit_pass.cc",
+        "introduce_floating_point_jitter_pass.cc",
+        "mark_for_cuda_graph_mode_pass.cc",
+        "mark_for_cuda_graph_mode_pass_test_helper.cc",  # NOTE(review): test helper compiled into a non-test library - confirm intended
+        "partially_decluster_pass.cc",
+        "report_clustering_info_pass.cc",
+        "async_io_conversion_pass.cc",
+    ],
+    hdrs = [
+        "build_cuda_graph_mode_ops_pass.h",
+        "clone_constants_for_better_clustering.h",
+        "cluster_scoping_pass.h",
+        "deadness_analysis.h",
+        "encapsulate_subgraphs_pass.h",
+        "encapsulate_cuda_graph_mode_subgraphs_pass.h",
+        "encapsulate_xla_computations_pass.h",
+        "extract_outside_compilation_pass.h",
+        "increase_dynamism_for_auto_jit_pass.h",
+        "introduce_floating_point_jitter_pass.h",
+        "mark_for_compilation_pass.h",  # NOTE(review): no matching .cc in srcs above - confirm where it is implemented
+        "mark_for_compilation_pass_test_helper.h",  # NOTE(review): no matching .cc in srcs above - confirm where it is implemented
+        "mark_for_cuda_graph_mode_pass.h",
+        "mark_for_cuda_graph_mode_pass_test_helper.h",
+        "partially_decluster_pass.h",
+        "report_clustering_info_pass.h",
+        "async_io_conversion_pass.h",
+    ],
+    deps = [
+        ":compilability_check_util",
+        ":common",
+        ":device_util",
+        ":encapsulate_util",
+        ":flags",
+        ":resource_operation_safety_analysis",
+        ":shape_inference_helpers",
+        ":xla_activity_listener",
+        ":xla_cluster_util",
+        ":cuda_graph_mode_cluster_util",
+        "//tensorflow/cc:cc_ops",
+        "//tensorflow/cc:functional_ops",
+        "//tensorflow/cc:ops",
+        "//tensorflow/cc:scope",
+        "//tensorflow/cc:scope_internal",
+        "//tensorflow/compiler/jit/graphcycles",
+        "//tensorflow/compiler/jit/ops:xla_ops",
+        "//tensorflow/compiler/jit/ops:async_io_ops",
+        "//tensorflow/compiler/tf2xla:resource_operation_table",
+        "//tensorflow/compiler/tf2xla:side_effect_util",
+        "//tensorflow/compiler/tf2xla:tf2xla_util",
+        "//tensorflow/compiler/tf2xla:xla_compiler",
+        "//tensorflow/compiler/tf2xla/cc:xla_jit_ops",
+        "//tensorflow/compiler/tf2xla/cc:xla_ops",
+        "//tensorflow/compiler/xla:status_macros",
+        "//tensorflow/compiler/xla:statusor",
+        "//tensorflow/compiler/xla:union_find",
+        "//tensorflow/compiler/xla:util",
+        "//tensorflow/core:core_cpu",
+        "//tensorflow/core:core_cpu_internal",
+        "//tensorflow/core:framework",
+        "//tensorflow/core:framework_bounds_check",
+        "//tensorflow/core:graph",
+        "//tensorflow/core:lib",
+        "//tensorflow/core:lib_internal",
+        "//tensorflow/core:protos_all_cc",
+        "//tensorflow/stream_executor/lib",
+        "@com_google_absl//absl/algorithm:container",
+        "@com_google_absl//absl/container:flat_hash_map",
+        "@com_google_absl//absl/container:flat_hash_set",
+        "@com_google_absl//absl/container:inlined_vector",
+        "@com_google_absl//absl/memory",
+        "@com_google_absl//absl/strings",
+        "@com_google_absl//absl/types:optional",
+    ],
+)
+
 cc_library(
     name = "xla_cluster_util",
     srcs = ["xla_cluster_util.cc"],
@@ -603,6 +703,31 @@ cc_library(
     ],
 )
 
+cc_library(  # Helper library (one .cc/.h pair) that :cuda_graph_mode_passes and its test depend on.
+    name = "cuda_graph_mode_cluster_util",
+    srcs = ["cuda_graph_mode_cluster_util.cc"],
+    hdrs = ["cuda_graph_mode_cluster_util.h"],
+    deps = [  # no visibility attribute is set here, so the package default (not shown in this diff) applies
+        ":flags",
+        ":xla_activity_proto_cc",
+        "//tensorflow/compiler/jit/graphcycles",
+        "//tensorflow/compiler/xla:status_macros",
+        "//tensorflow/compiler/xla:statusor",
+        "//tensorflow/core:core_cpu",
+        "//tensorflow/core:framework",
+        "//tensorflow/core:framework_bounds_check",
+        "//tensorflow/core:graph",
+        "//tensorflow/core:protos_all_cc",
+        "//tensorflow/stream_executor/lib",
+        "@com_google_absl//absl/algorithm:container",
+        "@com_google_absl//absl/container:flat_hash_map",
+        "@com_google_absl//absl/container:flat_hash_set",
+        "@com_google_absl//absl/strings",
+        "@com_google_absl//absl/types:optional",
+        "@com_google_absl//absl/types:span",
+    ],
+)
+
 cc_library(
     name = "device_util",
     srcs = ["device_util.cc"],
@@ -738,6 +863,63 @@ tf_cc_test(
     ],
 )
 
+tf_cc_test(  # Bundles the three CUDA-graph-mode pass test sources into a single test target.
+    name = "cuda_graph_mode_passes_test",
+    size = "small",
+    srcs = [
+        "mark_for_cuda_graph_mode_pass_test.cc",
+        "encapsulate_cuda_graph_mode_subgraphs_pass_test.cc",
+        "build_cuda_graph_mode_ops_pass_test.cc",
+    ],
+    # TODO(b/141643254) Re-enable msan after fixing use-of-uninitialized-value
+    # error.
+    tags = ["nomsan"] + tf_cuda_tests_tags(),  # "nomsan" per the TODO above; tf_cuda_tests_tags() is a macro defined outside this diff
+    deps = [
+        ":common",
+        ":cuda_graph_mode_passes",
+        ":compilation_passes",  # NOTE(review): linked together with :cuda_graph_mode_passes - confirm the two do not compile the same .cc files
+        ":compilation_passes_test_main",  # presumably supplies main() for the test binary - confirm
+        ":encapsulate_util",
+        ":flags",
+        ":node_matchers",
+        ":xla_cluster_util",
+        ":cuda_graph_mode_cluster_util",
+        ":xla_cpu_device",
+        ":xla_gpu_device",
+        "//tensorflow/cc:cc_ops",
+        "//tensorflow/cc:cc_ops_internal",
+        "//tensorflow/cc:function_ops",
+        "//tensorflow/cc:functional_ops",
+        "//tensorflow/cc:ops",
+        "//tensorflow/cc:resource_variable_ops",
+        "//tensorflow/cc:scope",
+        "//tensorflow/cc:sendrecv_ops",
+        "//tensorflow/compiler/jit/kernels:xla_ops",
+        "//tensorflow/compiler/jit/kernels:cuda_graph_mode_ops",
+        "//tensorflow/compiler/tf2xla:rearrange_function_argument",
+        "//tensorflow/compiler/tf2xla:side_effect_util",
+        "//tensorflow/compiler/tf2xla:test_util",
+        "//tensorflow/compiler/tf2xla:xla_compiler",
+        "//tensorflow/compiler/tf2xla/cc:xla_jit_ops",
+        "//tensorflow/compiler/tf2xla/cc:xla_ops",
+        "//tensorflow/compiler/tf2xla/kernels:xla_dummy_ops",
+        "//tensorflow/compiler/tf2xla/kernels:xla_ops",
+        "//tensorflow/compiler/xla:test",
+        "//tensorflow/core:core_cpu",
+        "//tensorflow/core:framework",
+        "//tensorflow/core:framework_internal",
+        "//tensorflow/core:lib",
+        "//tensorflow/core:protos_all_cc",
+        "//tensorflow/core:session_options",
+        "//tensorflow/core:test",
+        "//tensorflow/core:testlib",
+        "@com_google_absl//absl/container:flat_hash_map",
+        "@com_google_absl//absl/memory",
+        "@com_google_absl//absl/strings",
+        "@com_google_absl//absl/types:span",
+    ],
+)
+
 tf_cc_test(
     name = "xla_cluster_util_test",
     size = "small",