pytorch/tools/rules_cc/cuda_support.patch

diff --git cc/private/toolchain/unix_cc_configure.bzl cc/private/toolchain/unix_cc_configure.bzl
index ba992fc..e4e8364 100644
--- cc/private/toolchain/unix_cc_configure.bzl
+++ cc/private/toolchain/unix_cc_configure.bzl
@@ -27,6 +27,7 @@ load(
     "which",
     "write_builtin_include_directory_paths",
 )
+load("@rules_cuda//cuda:toolchain.bzl", "cuda_compiler_deps")
 
 def _field(name, value):
     """Returns properly indented top level crosstool field."""
@@ -397,7 +398,7 @@ def configure_unix_toolchain(repository_ctx, cpu_value, overriden_tools):
     cxx_opts = split_escaped(get_env_var(
         repository_ctx,
         "BAZEL_CXXOPTS",
-        "-std=c++0x",
+        "-std=c++17",
         False,
     ), ":")
 
@@ -463,7 +464,7 @@ def configure_unix_toolchain(repository_ctx, cpu_value, overriden_tools):
             )),
             "%{cc_compiler_deps}": get_starlark_list([":builtin_include_directory_paths"] + (
                 [":cc_wrapper"] if darwin else []
-            )),
+            ) + cuda_compiler_deps()),
             "%{cc_toolchain_identifier}": cc_toolchain_identifier,
             "%{compile_flags}": get_starlark_list(
                 [
diff --git cc/private/toolchain/unix_cc_toolchain_config.bzl cc/private/toolchain/unix_cc_toolchain_config.bzl
index c3cf3ba..1744eb4 100644
--- cc/private/toolchain/unix_cc_toolchain_config.bzl
+++ cc/private/toolchain/unix_cc_toolchain_config.bzl
@@ -25,6 +25,7 @@ load(
     "variable_with_value",
     "with_feature_set",
 )
+load("@rules_cuda//cuda:toolchain.bzl", "cuda_toolchain_config")
 
 all_compile_actions = [
     ACTION_NAMES.c_compile,
@@ -580,7 +581,8 @@ def _impl(ctx):
                 ],
                 flag_groups = [
                     flag_group(
-                        flags = ["-iquote", "%{quote_include_paths}"],
+                        # Use -isystem instead of -iquote: nvcc forwards -isystem to the host compiler but not -iquote.
+                        flags = ["-isystem", "%{quote_include_paths}"],
                         iterate_over = "quote_include_paths",
                     ),
                     flag_group(
@@ -1152,10 +1154,15 @@ def _impl(ctx):
             unfiltered_compile_flags_feature,
         ]
 
+    cuda = cuda_toolchain_config(
+        cuda_toolchain_info = ctx.attr._cuda_toolchain_info,
+        compiler_path = ctx.attr.tool_paths["gcc"],
+    )
+
     return cc_common.create_cc_toolchain_config_info(
         ctx = ctx,
-        features = features,
-        action_configs = action_configs,
+        features = features + cuda.features,
+        action_configs = action_configs + cuda.action_configs,
         cxx_builtin_include_directories = ctx.attr.cxx_builtin_include_directories,
         toolchain_identifier = ctx.attr.toolchain_identifier,
         host_system_name = ctx.attr.host_system_name,
@@ -1192,6 +1199,9 @@ cc_toolchain_config = rule(
         "tool_paths": attr.string_dict(),
         "toolchain_identifier": attr.string(mandatory = True),
         "unfiltered_compile_flags": attr.string_list(),
+        "_cuda_toolchain_info": attr.label(
+            default = Label("@rules_cuda//cuda:cuda_toolchain_info"),
+        ),
     },
     provides = [CcToolchainConfigInfo],
 )
[bazel] enable sccache+nvcc in CI (#95528) Fixes #79348 This change is mostly focused on enabling nvcc+sccache in the PyTorch CI. Along the way we had to make a couple of tweaks: 1. Split rules_cc from the rules_cuda that embedded it before. This is needed in order to apply a different patch to rules_cc compared to the one that rules_cuda applies by default. This is in turn needed because we need to work around an nvcc behavior where it doesn't send `-iquote xxx` to the host compiler, but it does send `-isystem xxx`. So we work around this problem by (ab)using `-isystem` instead. Without it we get errors like `xxx` is not found. 2. Work around a bug in Bazel, https://github.com/bazelbuild/bazel/issues/10167, that prevents us from using a straightforward and honest `nvcc` sccache wrapper. Instead we generate an ad hoc, Bazel-specific nvcc wrapper that has internal knowledge of the relative Bazel paths to local_cuda. This allows us to work around the issue with CUDA symlinks. Without it we get `undeclared inclusion(s) in rule` errors all over the place for CUDA headers. 
## Test plan Green CI build https://github.com/pytorch/pytorch/actions/runs/4267147180/jobs/7428431740 Note that now it says "CUDA" in the sccache output ``` + sccache --show-stats Compile requests 9784 Compile requests executed 6726 Cache hits 6200 Cache hits (C/C++) 6131 Cache hits (CUDA) 69 Cache misses 519 Cache misses (C/C++) 201 Cache misses (CUDA) 318 Cache timeouts 0 Cache read errors 0 Forced recaches 0 Cache write errors 0 Compilation failures 0 Cache errors 7 Cache errors (C/C++) 7 Non-cacheable compilations 0 Non-cacheable calls 2893 Non-compilation calls 165 Unsupported compiler calls 0 Average cache write 0.116 s Average cache read miss 23.722 s Average cache read hit 0.057 s Failed distributed compilations 0 ``` Pull Request resolved: https://github.com/pytorch/pytorch/pull/95528 Approved by: https://github.com/huydhn 2023-02-28 03:51:08 +00:00			`diff --git cc/private/toolchain/unix_cc_configure.bzl cc/private/toolchain/unix_cc_configure.bzl`
			`index ba992fc..e4e8364 100644`
			`--- cc/private/toolchain/unix_cc_configure.bzl`
			`+++ cc/private/toolchain/unix_cc_configure.bzl`
			`@@ -27,6 +27,7 @@ load(`
			`"which",`
			`"write_builtin_include_directory_paths",`
			`)`
			`+load("@rules_cuda//cuda:toolchain.bzl", "cuda_compiler_deps")`

			`def _field(name, value):`
			`"""Returns properly indented top level crosstool field."""`
			`@@ -397,7 +398,7 @@ def configure_unix_toolchain(repository_ctx, cpu_value, overriden_tools):`
			`cxx_opts = split_escaped(get_env_var(`
			`repository_ctx,`
			`"BAZEL_CXXOPTS",`
			`- "-std=c++0x",`
[BE] Fix incompatible-std-redefinition warning (#141630) Fixes the following warning during CUDA Bazel builds: ``` nvcc-real warning : incompatible redefinition for option 'std', the last value of this option was used ``` Pull Request resolved: https://github.com/pytorch/pytorch/pull/141630 Approved by: https://github.com/cyyever, https://github.com/kit1980 2024-11-27 05:06:34 +00:00			`+ "-std=c++17",`
[bazel] enable sccache+nvcc in CI (#95528) Fixes #79348 This change is mostly focused on enabling nvcc+sccache in the PyTorch CI. Along the way we had to make a couple of tweaks: 1. Split rules_cc from the rules_cuda that embedded it before. This is needed in order to apply a different patch to rules_cc compared to the one that rules_cuda applies by default. This is in turn needed because we need to work around an nvcc behavior where it doesn't send `-iquote xxx` to the host compiler, but it does send `-isystem xxx`. So we work around this problem by (ab)using `-isystem` instead. Without it we get errors like `xxx` is not found. 2. Work around a bug in Bazel, https://github.com/bazelbuild/bazel/issues/10167, that prevents us from using a straightforward and honest `nvcc` sccache wrapper. Instead we generate an ad hoc, Bazel-specific nvcc wrapper that has internal knowledge of the relative Bazel paths to local_cuda. This allows us to work around the issue with CUDA symlinks. Without it we get `undeclared inclusion(s) in rule` errors all over the place for CUDA headers. ## Test plan Green CI build https://github.com/pytorch/pytorch/actions/runs/4267147180/jobs/7428431740 Note that now it says "CUDA" in the sccache output ``` + sccache --show-stats Compile requests 9784 Compile requests executed 6726 Cache hits 6200 Cache hits (C/C++) 6131 Cache hits (CUDA) 69 Cache misses 519 Cache misses (C/C++) 201 Cache misses (CUDA) 318 Cache timeouts 0 Cache read errors 0 Forced recaches 0 Cache write errors 0 Compilation failures 0 Cache errors 7 Cache errors (C/C++) 7 Non-cacheable compilations 0 Non-cacheable calls 2893 Non-compilation calls 165 Unsupported compiler calls 0 Average cache write 0.116 s Average cache read miss 23.722 s Average cache read hit 0.057 s Failed distributed compilations 0 ``` Pull Request resolved: https://github.com/pytorch/pytorch/pull/95528 Approved by: https://github.com/huydhn 2023-02-28 03:51:08 +00:00			`False,`
			`), ":")`

			`@@ -463,7 +464,7 @@ def configure_unix_toolchain(repository_ctx, cpu_value, overriden_tools):`
			`)),`
			`"%{cc_compiler_deps}": get_starlark_list([":builtin_include_directory_paths"] + (`
			`[":cc_wrapper"] if darwin else []`
			`- )),`
			`+ ) + cuda_compiler_deps()),`
			`"%{cc_toolchain_identifier}": cc_toolchain_identifier,`
			`"%{compile_flags}": get_starlark_list(`
			`[`
			`diff --git cc/private/toolchain/unix_cc_toolchain_config.bzl cc/private/toolchain/unix_cc_toolchain_config.bzl`
			`index c3cf3ba..1744eb4 100644`
			`--- cc/private/toolchain/unix_cc_toolchain_config.bzl`
			`+++ cc/private/toolchain/unix_cc_toolchain_config.bzl`
			`@@ -25,6 +25,7 @@ load(`
			`"variable_with_value",`
			`"with_feature_set",`
			`)`
			`+load("@rules_cuda//cuda:toolchain.bzl", "cuda_toolchain_config")`

			`all_compile_actions = [`
			`ACTION_NAMES.c_compile,`
			`@@ -580,7 +581,8 @@ def _impl(ctx):`
			`],`
			`flag_groups = [`
			`flag_group(`
			`- flags = ["-iquote", "%{quote_include_paths}"],`
			`+ # Use -isystem instead of -iquote: nvcc forwards -isystem to the host compiler but not -iquote.`
			`+ flags = ["-isystem", "%{quote_include_paths}"],`
			`iterate_over = "quote_include_paths",`
			`),`
			`flag_group(`
			`@@ -1152,10 +1154,15 @@ def _impl(ctx):`
			`unfiltered_compile_flags_feature,`
			`]`

			`+ cuda = cuda_toolchain_config(`
			`+ cuda_toolchain_info = ctx.attr._cuda_toolchain_info,`
			`+ compiler_path = ctx.attr.tool_paths["gcc"],`
			`+ )`
			`+`
			`return cc_common.create_cc_toolchain_config_info(`
			`ctx = ctx,`
			`- features = features,`
			`- action_configs = action_configs,`
			`+ features = features + cuda.features,`
			`+ action_configs = action_configs + cuda.action_configs,`
			`cxx_builtin_include_directories = ctx.attr.cxx_builtin_include_directories,`
			`toolchain_identifier = ctx.attr.toolchain_identifier,`
			`host_system_name = ctx.attr.host_system_name,`
			`@@ -1192,6 +1199,9 @@ cc_toolchain_config = rule(`
			`"tool_paths": attr.string_dict(),`
			`"toolchain_identifier": attr.string(mandatory = True),`
			`"unfiltered_compile_flags": attr.string_list(),`
			`+ "_cuda_toolchain_info": attr.label(`
			`+ default = Label("@rules_cuda//cuda:cuda_toolchain_info"),`
			`+ ),`
			`},`
			`provides = [CcToolchainConfigInfo],`
			`)`